Python 线程池

清华大佬耗费三个月吐血整理的几百G的资源,免费分享!....>>>

# !/usr/bin/env python  
# -*- coding:utf-8 -*-  
  
import Queue
import re
import threading
import time
import traceback
import urllib2

from bs4 import BeautifulSoup
  
class WorkManager(object):
    """Small thread pool that pre-fills a job queue and drains it with workers.

    The constructor enqueues ``work_num`` jobs and then creates
    ``thread_num`` ``Work`` threads. Each ``Work`` starts itself when it is
    constructed, so jobs begin running before ``__init__`` returns.
    """

    def __init__(self, work_num=1000, thread_num=2, job_func=None):
        """Fill the job queue, then create the worker threads.

        Args:
            work_num: Number of jobs to enqueue up front.
            thread_num: Number of worker threads to create.
            job_func: Callable run for every job; it receives the job's
                argument list as a single positional argument. Defaults to
                the module-level ``do_job``.
        """
        self.work_queue = Queue.Queue()
        self.threads = []
        # Fill the queue before creating workers: a worker exits as soon as
        # it finds the queue empty.
        self.__init_work_queue(work_num, job_func)
        self.__init_thread_pool(thread_num)

    def __init_thread_pool(self, thread_num):
        """Create ``thread_num`` workers bound to the shared job queue."""
        for _ in range(thread_num):
            self.threads.append(Work(self.work_queue))

    def __init_work_queue(self, jobs_num, func=None):
        """Enqueue ``jobs_num`` jobs, each called with ``[index, jobs_num]``."""
        if func is None:
            func = do_job
        for i in range(jobs_num):
            self.add_job(func, i, jobs_num)

    def add_job(self, func, *args):
        """Put one job on the queue.

        Args:
            func: Callable to run.
            *args: Job arguments; they are stored as a list and handed to
                ``func`` as one positional argument.
        """
        # Queue does its own locking, so no extra synchronization is needed.
        self.work_queue.put((func, list(args)))

    def wait_allcomplete(self):
        """Block until every worker thread has finished."""
        for worker in self.threads:
            # is_alive() replaces isAlive(), which was removed in Python 3.9.
            if worker.is_alive():
                worker.join()
  
class Work(threading.Thread):
    """Worker thread that runs jobs from a shared queue until it is empty.

    The thread starts itself at construction time.
    """

    def __init__(self, work_queue):
        """Bind the worker to ``work_queue`` and start running immediately.

        Args:
            work_queue: Queue of ``(func, args)`` tuples; ``args`` is passed
                to ``func`` as a single positional argument.
        """
        threading.Thread.__init__(self)
        self.work_queue = work_queue
        self.start()

    def run(self):
        """Execute queued jobs one by one; return once the queue is empty."""
        while True:
            try:
                # Non-blocking get: an empty queue is the signal to stop.
                do, args = self.work_queue.get(block=False)
            except Queue.Empty:
                break
            try:
                do(args)
            except Exception:
                # A failing job is reported but must not kill the worker,
                # otherwise the remaining jobs would never be processed.
                traceback.print_exc()
            finally:
                # Mark the job finished whether it succeeded or failed.
                self.work_queue.task_done()
  
def do_job(args, url='http://www.baidu.com', timeout=10):
    """Run one job: download a page and print its title with the job args.

    Args:
        args: Sequence of job arguments; the whole sequence and ``args[0]``
            are printed after the page title.
        url: Address of the page to download.
        timeout: Socket timeout in seconds for the request, so a stalled
            connection cannot block the calling thread forever.
    """
    page = urllib2.urlopen(url, timeout=timeout)
    try:
        html = page.read()
    finally:
        # Release the connection even when read() fails.
        page.close()
    soup = BeautifulSoup(html, "html.parser")
    # A page without a <title> tag yields None instead of an AttributeError.
    title_tag = soup.title
    title = title_tag.string if title_tag is not None else None
    # Build the line first; a single-argument print() call is valid in both
    # Python 2 and Python 3 and produces the same output.
    print("%s %s %s" % (title, list(args), args[0]))
  
if __name__ == '__main__':
    # Time a full run: 100 jobs handled by 2 worker threads.
    started_at = time.time()
    pool = WorkManager(100, 2)
    pool.wait_allcomplete()
    elapsed = time.time() - started_at
    print("cost all time: %s" % elapsed)