| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | # Copyright 2009 Brian Quinlan. All Rights Reserved. | 
					
						
							|  |  |  | # Licensed to PSF under a Contributor Agreement. | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | """Implements ThreadPoolExecutor.""" | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | __author__ = 'Brian Quinlan (brian@sweetapp.com)' | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | import atexit | 
					
						
							|  |  |  | from concurrent.futures import _base | 
					
						
							| 
									
										
										
										
											2017-06-21 23:41:13 -07:00
										 |  |  | import itertools | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | import queue | 
					
						
							|  |  |  | import threading | 
					
						
							|  |  |  | import weakref | 
					
						
							| 
									
										
										
										
											2014-09-02 10:39:18 -07:00
										 |  |  | import os | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | # Workers are created as daemon threads. This is done to allow the interpreter | 
					
						
							|  |  |  | # to exit when there are still idle threads in a ThreadPoolExecutor's thread | 
					
						
							|  |  |  | # pool (i.e. shutdown() was not called). However, allowing workers to die with | 
					
						
							|  |  |  | # the interpreter has two undesirable properties: | 
					
						
							| 
									
										
										
										
											2016-08-30 10:47:49 -07:00
										 |  |  | #   - The workers would still be running during interpreter shutdown, | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | #     meaning that they would fail in unpredictable ways. | 
					
						
							|  |  |  | #   - The workers could be killed while evaluating a work item, which could | 
					
						
							|  |  |  | #     be bad if the callable being evaluated has external side-effects e.g. | 
					
						
							|  |  |  | #     writing to a file. | 
					
						
							|  |  |  | # | 
					
						
							|  |  |  | # To work around this problem, an exit handler is installed which tells the | 
					
						
							|  |  |  | # workers to exit when their work queues are empty and then waits until the | 
					
						
							|  |  |  | # threads finish. | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  | _threads_queues = weakref.WeakKeyDictionary() | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | _shutdown = False | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | def _python_exit(): | 
					
						
							|  |  |  |     global _shutdown | 
					
						
							|  |  |  |     _shutdown = True | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |     items = list(_threads_queues.items()) | 
					
						
							|  |  |  |     for t, q in items: | 
					
						
							|  |  |  |         q.put(None) | 
					
						
							|  |  |  |     for t, q in items: | 
					
						
							|  |  |  |         t.join() | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  | atexit.register(_python_exit) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | class _WorkItem(object): | 
					
						
							|  |  |  |     def __init__(self, future, fn, args, kwargs): | 
					
						
							|  |  |  |         self.future = future | 
					
						
							|  |  |  |         self.fn = fn | 
					
						
							|  |  |  |         self.args = args | 
					
						
							|  |  |  |         self.kwargs = kwargs | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def run(self): | 
					
						
							|  |  |  |         if not self.future.set_running_or_notify_cancel(): | 
					
						
							|  |  |  |             return | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         try: | 
					
						
							|  |  |  |             result = self.fn(*self.args, **self.kwargs) | 
					
						
							| 
									
										
										
										
											2017-08-22 16:50:42 +02:00
										 |  |  |         except BaseException as exc: | 
					
						
							|  |  |  |             self.future.set_exception(exc) | 
					
						
							|  |  |  |             # Break a reference cycle with the exception 'exc' | 
					
						
							|  |  |  |             self = None | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         else: | 
					
						
							|  |  |  |             self.future.set_result(result) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | def _worker(executor_reference, work_queue, initializer, initargs): | 
					
						
							|  |  |  |     if initializer is not None: | 
					
						
							|  |  |  |         try: | 
					
						
							|  |  |  |             initializer(*initargs) | 
					
						
							|  |  |  |         except BaseException: | 
					
						
							|  |  |  |             _base.LOGGER.critical('Exception in initializer:', exc_info=True) | 
					
						
							|  |  |  |             executor = executor_reference() | 
					
						
							|  |  |  |             if executor is not None: | 
					
						
							|  |  |  |                 executor._initializer_failed() | 
					
						
							|  |  |  |             return | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |     try: | 
					
						
							|  |  |  |         while True: | 
					
						
							| 
									
										
										
										
											2011-04-12 17:48:46 +02:00
										 |  |  |             work_item = work_queue.get(block=True) | 
					
						
							|  |  |  |             if work_item is not None: | 
					
						
							|  |  |  |                 work_item.run() | 
					
						
							| 
									
										
										
										
											2012-11-03 15:36:01 +02:00
										 |  |  |                 # Delete references to object. See issue16284 | 
					
						
							|  |  |  |                 del work_item | 
					
						
							| 
									
										
										
										
											2011-04-12 17:48:46 +02:00
										 |  |  |                 continue | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |             executor = executor_reference() | 
					
						
							|  |  |  |             # Exit if: | 
					
						
							|  |  |  |             #   - The interpreter is shutting down OR | 
					
						
							|  |  |  |             #   - The executor that owns the worker has been collected OR | 
					
						
							|  |  |  |             #   - The executor that owns the worker has been shutdown. | 
					
						
							|  |  |  |             if _shutdown or executor is None or executor._shutdown: | 
					
						
							| 
									
										
										
										
											2018-04-10 18:23:14 +01:00
										 |  |  |                 # Flag the executor as shutting down as early as possible if it | 
					
						
							|  |  |  |                 # is not gc-ed yet. | 
					
						
							|  |  |  |                 if executor is not None: | 
					
						
							|  |  |  |                     executor._shutdown = True | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |                 # Notice other workers | 
					
						
							|  |  |  |                 work_queue.put(None) | 
					
						
							|  |  |  |                 return | 
					
						
							|  |  |  |             del executor | 
					
						
							| 
									
										
										
										
											2011-11-11 20:05:50 +01:00
										 |  |  |     except BaseException: | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         _base.LOGGER.critical('Exception in worker', exc_info=True) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  | 
 | 
					
						
							|  |  |  | class BrokenThreadPool(_base.BrokenExecutor): | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  |     Raised when a worker thread in a ThreadPoolExecutor failed initializing. | 
					
						
							|  |  |  |     """
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | class ThreadPoolExecutor(_base.Executor): | 
					
						
							| 
									
										
										
										
											2017-06-21 23:41:13 -07:00
										 |  |  | 
 | 
					
						
							|  |  |  |     # Used to assign unique thread names when thread_name_prefix is not supplied. | 
					
						
							|  |  |  |     _counter = itertools.count().__next__ | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |     def __init__(self, max_workers=None, thread_name_prefix='', | 
					
						
							|  |  |  |                  initializer=None, initargs=()): | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         """Initializes a new ThreadPoolExecutor instance.
 | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         Args: | 
					
						
							|  |  |  |             max_workers: The maximum number of threads that can be used to | 
					
						
							|  |  |  |                 execute the given calls. | 
					
						
							| 
									
										
										
										
											2016-08-07 10:19:20 -07:00
										 |  |  |             thread_name_prefix: An optional name prefix to give our threads. | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |             initializer: An callable used to initialize worker threads. | 
					
						
							|  |  |  |             initargs: A tuple of arguments to pass to the initializer. | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         """
 | 
					
						
							| 
									
										
										
										
											2014-09-02 10:39:18 -07:00
										 |  |  |         if max_workers is None: | 
					
						
							|  |  |  |             # Use this number because ThreadPoolExecutor is often | 
					
						
							|  |  |  |             # used to overlap I/O instead of CPU work. | 
					
						
							|  |  |  |             max_workers = (os.cpu_count() or 1) * 5 | 
					
						
							| 
									
										
										
										
											2014-05-17 13:51:10 -07:00
										 |  |  |         if max_workers <= 0: | 
					
						
							|  |  |  |             raise ValueError("max_workers must be greater than 0") | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |         if initializer is not None and not callable(initializer): | 
					
						
							|  |  |  |             raise TypeError("initializer must be a callable") | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         self._max_workers = max_workers | 
					
						
							| 
									
										
										
										
											2018-01-18 10:38:03 +01:00
										 |  |  |         self._work_queue = queue.SimpleQueue() | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         self._threads = set() | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |         self._broken = False | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         self._shutdown = False | 
					
						
							|  |  |  |         self._shutdown_lock = threading.Lock() | 
					
						
							| 
									
										
										
										
											2017-06-21 23:41:13 -07:00
										 |  |  |         self._thread_name_prefix = (thread_name_prefix or | 
					
						
							|  |  |  |                                     ("ThreadPoolExecutor-%d" % self._counter())) | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |         self._initializer = initializer | 
					
						
							|  |  |  |         self._initargs = initargs | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2019-04-01 09:16:35 +03:00
										 |  |  |     def submit(*args, **kwargs): | 
					
						
							|  |  |  |         if len(args) >= 2: | 
					
						
							|  |  |  |             self, fn, *args = args | 
					
						
							|  |  |  |         elif not args: | 
					
						
							|  |  |  |             raise TypeError("descriptor 'submit' of 'ThreadPoolExecutor' object " | 
					
						
							|  |  |  |                             "needs an argument") | 
					
						
							|  |  |  |         elif 'fn' in kwargs: | 
					
						
							|  |  |  |             fn = kwargs.pop('fn') | 
					
						
							|  |  |  |             self, *args = args | 
					
						
							|  |  |  |             import warnings | 
					
						
							|  |  |  |             warnings.warn("Passing 'fn' as keyword argument is deprecated", | 
					
						
							|  |  |  |                           DeprecationWarning, stacklevel=2) | 
					
						
							|  |  |  |         else: | 
					
						
							|  |  |  |             raise TypeError('submit expected at least 1 positional argument, ' | 
					
						
							|  |  |  |                             'got %d' % (len(args)-1)) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         with self._shutdown_lock: | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |             if self._broken: | 
					
						
							|  |  |  |                 raise BrokenThreadPool(self._broken) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |             if self._shutdown: | 
					
						
							|  |  |  |                 raise RuntimeError('cannot schedule new futures after shutdown') | 
					
						
							| 
									
										
										
										
											2018-04-10 18:23:14 +01:00
										 |  |  |             if _shutdown: | 
					
						
							| 
									
										
										
										
											2018-11-05 16:20:25 +02:00
										 |  |  |                 raise RuntimeError('cannot schedule new futures after ' | 
					
						
							| 
									
										
										
										
											2018-04-10 18:23:14 +01:00
										 |  |  |                                    'interpreter shutdown') | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | 
 | 
					
						
							|  |  |  |             f = _base.Future() | 
					
						
							|  |  |  |             w = _WorkItem(f, fn, args, kwargs) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |             self._work_queue.put(w) | 
					
						
							|  |  |  |             self._adjust_thread_count() | 
					
						
							|  |  |  |             return f | 
					
						
							| 
									
										
										
										
											2019-05-06 22:40:27 +03:00
										 |  |  |     submit.__text_signature__ = _base.Executor.submit.__text_signature__ | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |     submit.__doc__ = _base.Executor.submit.__doc__ | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     def _adjust_thread_count(self): | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |         # When the executor gets lost, the weakref callback will wake up | 
					
						
							|  |  |  |         # the worker threads. | 
					
						
							|  |  |  |         def weakref_cb(_, q=self._work_queue): | 
					
						
							|  |  |  |             q.put(None) | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         # TODO(bquinlan): Should avoid creating new threads if there are more | 
					
						
							|  |  |  |         # idle threads than items in the work queue. | 
					
						
							| 
									
										
										
										
											2016-08-07 10:19:20 -07:00
										 |  |  |         num_threads = len(self._threads) | 
					
						
							|  |  |  |         if num_threads < self._max_workers: | 
					
						
							|  |  |  |             thread_name = '%s_%d' % (self._thread_name_prefix or self, | 
					
						
							|  |  |  |                                      num_threads) | 
					
						
							|  |  |  |             t = threading.Thread(name=thread_name, target=_worker, | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |                                  args=(weakref.ref(self, weakref_cb), | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |                                        self._work_queue, | 
					
						
							|  |  |  |                                        self._initializer, | 
					
						
							|  |  |  |                                        self._initargs)) | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |             t.daemon = True | 
					
						
							|  |  |  |             t.start() | 
					
						
							|  |  |  |             self._threads.add(t) | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |             _threads_queues[t] = self._work_queue | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2017-11-04 11:05:49 +01:00
										 |  |  |     def _initializer_failed(self): | 
					
						
							|  |  |  |         with self._shutdown_lock: | 
					
						
							|  |  |  |             self._broken = ('A thread initializer failed, the thread pool ' | 
					
						
							|  |  |  |                             'is not usable anymore') | 
					
						
							|  |  |  |             # Drain work queue and mark pending futures failed | 
					
						
							|  |  |  |             while True: | 
					
						
							|  |  |  |                 try: | 
					
						
							|  |  |  |                     work_item = self._work_queue.get_nowait() | 
					
						
							|  |  |  |                 except queue.Empty: | 
					
						
							|  |  |  |                     break | 
					
						
							|  |  |  |                 if work_item is not None: | 
					
						
							|  |  |  |                     work_item.future.set_exception(BrokenThreadPool(self._broken)) | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |     def shutdown(self, wait=True): | 
					
						
							|  |  |  |         with self._shutdown_lock: | 
					
						
							|  |  |  |             self._shutdown = True | 
					
						
							| 
									
										
										
										
											2011-03-26 19:29:44 +01:00
										 |  |  |             self._work_queue.put(None) | 
					
						
							| 
									
										
										
										
											2010-09-18 22:35:02 +00:00
										 |  |  |         if wait: | 
					
						
							|  |  |  |             for t in self._threads: | 
					
						
							|  |  |  |                 t.join() | 
					
						
							|  |  |  |     shutdown.__doc__ = _base.Executor.shutdown.__doc__ |