无法让多个进程同时运行

def _run_normalizer_process(config, debug, name):
    """Body of one normalizer worker process.

    Defined at module level (rather than nested inside ``run_normalizers``)
    so that it can be pickled when ``multiprocessing`` uses the "spawn" start
    method; a nested closure cannot be used as a ``Process`` target there.

    Args:
        config: Configuration object handed to the project helpers; its
            ``AWS_S3_IMAGE_BUCKET`` and ``AWS_S3_STORAGE_BUCKET`` attributes
            are read here.
        debug: Forwarded to ``PipedPiper`` as ``debug=``.
        name: When truthy, only ``run_pipeline_normalizers(name)`` is run;
            otherwise ``run_all_normalizers()`` is run.
    """
    print('Started process for normalizer')
    # The return value is not used; presumably the call is needed for its
    # side effects (engine/session setup) -- TODO confirm.
    init_sqla_from_config(config)
    image_vfs = create_s3vfs_from_config(config, config.AWS_S3_IMAGE_BUCKET)
    storage_vfs = create_s3vfs_from_config(config, config.AWS_S3_STORAGE_BUCKET)
    pp = PipedPiper(config, image_vfs, storage_vfs, debug=debug)
    if name:
        pp.run_pipeline_normalizers(name)
    else:
        pp.run_all_normalizers()
    print('Normalizer process complete')


def run_normalizers(config, debug, num_threads, name=None):
    """Run the normalizers in ``num_threads`` parallel processes.

    Starts every process first and only then joins them, so the processes
    run concurrently; returns once all of them have exited.

    Args:
        config: Configuration object passed to every worker process.
        debug: Debug flag passed to every worker process.
        num_threads: Number of worker *processes* to start (the name is
            historical; ``multiprocessing.Process`` is used, not threads).
        name: Optional pipeline name; see ``_run_normalizer_process``.
    """
    processes = [
        multiprocessing.Process(
            target=_run_normalizer_process, args=(config, debug, name))
        for _ in range(num_threads)
    ]
    for process in processes:
        process.start()
    for process in processes:
        process.join()


# Guarded so that child processes re-importing this module (spawn start
# method) do not start normalizers again. The arguments were elided in the
# original post and must be filled in by the caller.
if __name__ == '__main__':
    run_normalizers(...)

2条回答

网友

1楼 · 编辑于 2024-10-17 06:18:10

如果您仍在寻找多进程（multiprocessing）解决方案，可以先看看如何使用工作进程池（Pool），这样就不必自己管理 num_threads 个进程：http://docs.python.org/2/library/multiprocessing.html#using-a-pool-of-workers

对于变慢的问题，您是否尝试过将 config 对象作为参数传递给 _run 函数？我不确定这在内部是否会（或如何）带来变化，但我猜它可能会有所影响。

网友

2楼 · 编辑于 2024-10-17 06:18:10

解决了我的多进程问题——实际上是改用了线程。我不知道究竟是什么起了作用——我只是把所有东西重新设计了一遍，做成了工作线程（worker）和任务（task）之类的结构，现在一切都运行得飞快。以下是我所做的基本工作：

import abc
import traceback
from Queue import Empty, Queue
from threading import Thread

class AbstractTask(object):
    """Interface for a unit of work; subclasses provide ``run_task``."""

    # Python 2 spelling of the metaclass declaration: under Python 2 this
    # makes the class abstract via ABCMeta.
    __metaclass__ = abc.ABCMeta

    @abc.abstractmethod
    def run_task(self):
        """Perform the task's work; concrete subclasses override this."""

class TaskRunner(object):
    """Run queued tasks on a fixed set of daemon worker threads.

    A task is any object with a ``run_task()`` method. Tasks are pulled from
    a shared queue by the workers started in ``__init__``.

    Attributes:
        queue: The ``Queue`` holding pending tasks.
        execute_tasks: True while the runner accepts and executes tasks; set
            to False when a task fails and ``stop_on_exception`` is set.
        stop_on_exception: Whether the first failing task stops the runner.
    """

    def __init__(self, queue_size, num_threads=1, stop_on_exception=False):
        """Create the queue and start the worker threads.

        Args:
            queue_size: Maximum number of pending tasks, passed straight to
                ``Queue``.
            num_threads: Number of worker threads to start (converted with
                ``int``).
            stop_on_exception: If true, the first task that raises stops the
                whole runner; otherwise the failure is reported and the
                remaining tasks keep running.
        """
        super(TaskRunner, self).__init__()
        self.queue = Queue(queue_size)
        self.execute_tasks = True
        self.stop_on_exception = stop_on_exception

        # Daemon threads, so idle workers never keep the interpreter alive.
        for _ in range(int(num_threads)):
            worker = Thread(target=self._worker)
            worker.daemon = True
            worker.start()

    def _worker(self):
        """Worker loop: run tasks until the runner stops, then drain."""
        while self.execute_tasks:
            try:
                # Block for up to one second. A non-blocking get ignores the
                # timeout and would make idle workers spin at full CPU; the
                # timeout is kept so the stop flag is re-checked regularly.
                task = self.queue.get(True, 1)
            except Empty:
                continue
            self._run_one(task)
        # The runner was stopped: make sure queue.join() can still return.
        self._discard_pending()

    def _run_one(self, task):
        """Run a single task and always mark it done on the queue."""
        try:
            task.run_task()
        except Exception:
            # Report the failure here instead of letting it propagate: an
            # escaping exception would terminate this worker thread and
            # leave the remaining tasks without anyone to run them.
            traceback.print_exc()
            if self.stop_on_exception:
                print('Stopping due to exception')
                self.execute_tasks = False
        finally:
            self.queue.task_done()

    def _discard_pending(self):
        """Drop tasks still queued after a stop so ``join()`` is released."""
        while True:
            try:
                self.queue.get(False)
            except Empty:
                return
            self.queue.task_done()

    def add_task(self, task, block=True, timeout=None):
        """Queue a task for execution.

        Args:
            task: Object with a ``run_task()`` method.
            block: Passed to ``Queue.put``.
            timeout: Passed to ``Queue.put``.

        Raises:
            Exception: If the runner has been stopped.
        """
        if not self.execute_tasks:
            raise Exception('TaskRunner is not accepting tasks')
        self.queue.put(task, block, timeout)

    def wait_for_tasks(self):
        """Block until every queued task has been processed.

        If the runner is stopped while waiting, tasks still in the queue are
        discarded by the workers and this call returns.

        Raises:
            Exception: If the runner was already stopped when called.
        """
        if not self.execute_tasks:
            raise Exception('TaskRunner is not accepting tasks')
        self.queue.join()

我所要做的就是创建一个 TaskRunner，向其添加任务（数千个），然后调用 wait_for_tasks()。所以很明显，在这次重新设计的过程中，我顺带“修复”了之前遇到的某个其他问题。不过这还是很奇怪。

相关问题更多 >

编程相关推荐

热门问题

热门文章