zl程序教程

您现在的位置是:首页 >  后端

当前栏目

Python 并发爬虫的快感

时间:2023-09-14 09:06:37
import time
from tomorrow import threads
from requests_html import HTMLSession
# One module-level HTTP session, reused by every download() call.
session = HTMLSession()
@threads(50)  # decorator: this function is executed asynchronously
def download(url, timeout=30):
    """Fetch ``url`` with an HTTP GET on the shared module-level ``session``.

    Args:
        url: Address to request.
        timeout: Seconds to wait on the server before giving up. Without a
            timeout a stalled server would keep the call blocked
            indefinitely.

    Returns:
        Whatever ``session.get`` returns for the request.
        NOTE(review): because of the ``threads`` decorator the caller
        presumably receives a deferred result rather than the response
        itself -- confirm against the ``tomorrow`` documentation.
    """
    return session.get(url, timeout=timeout)


def main():
    """Download a fixed batch of pages, print their titles and the time taken.

    Every URL is handed to ``download`` first; only afterwards are the
    results read to extract each page's ``<title>`` text. The list of
    objects returned by ``download``, the list of extracted titles and the
    elapsed time are all printed to standard output.
    """
    # perf_counter() is intended for measuring elapsed durations; unlike
    # time.time() it is not affected by adjustments to the system clock.
    start = time.perf_counter()

    # The workload is the same five pages requested 17 times over
    # (85 requests in total), in this repeating order.
    pages = [
        'https://pypi.org/project/tomorrow/0.2.0/',
        'https://www.cnblogs.com/pyld/p/4716744.html',
        'http://www.xicidaili.com/nn/10',
        'http://baidu.com',
        'http://www.bubuko.com/infodetail-1028793.html?yyue=a21bo.50862.201879',
    ]
    urls = pages * 17

    # Submit every request before touching any result: download() is
    # decorated to run asynchronously, so reading a result early would
    # presumably serialise the requests.
    req_list = [download(url) for url in urls]
    print(req_list)

    # Extract the text of the <title> element from each fetched page.
    responses = [req.html.xpath("//title/text()") for req in req_list]
    print(responses)

    end = time.perf_counter()
    print("Time: %f seconds" % (end - start))


# Run the download benchmark only when executed as a script, not on import.
if __name__ == "__main__":
    main()