利用队列及多进程下载音频文件

import requests
import os

def geturllist(queue):
    url = 'https://www.ximalaya.com/revision/play/album?albumId=3423007&pageNum=1&sort=-1&pageSize=30'
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.84 Safari/537.36',
        'Referer': 'https://www.ximalaya.com/youshengshu/3423007/',
        'Cookie': 'Hm_lvt_4a7d8ec50cfd6af753c4f8aee3425070=1534755334; Hm_lpvt_4a7d8ec50cfd6af753c4f8aee3425070=1534762050',
    }

    response = requests.get(url, headers=headers)
    res_dict = response.json()
    # print(res_str)
    # print(type(res_str))

    for m4a_ob in res_dict['data']['tracksAudioPlay']:
        url_m = m4a_ob['src']
        # save to queue
        queue.put(url_m)
        # res_m = requests.get(url=url_m,headers=headers)
        # with open('test.m4a','wb') as f:
        #     f.write(res_m.content)
        # break


def download_r(url):
    url_m4a = url
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.84 Safari/537.36',
        'Referer': 'https://www.ximalaya.com/youshengshu/3423007/',
        'Cookie': 'Hm_lvt_4a7d8ec50cfd6af753c4f8aee3425070=1534755334; Hm_lpvt_4a7d8ec50cfd6af753c4f8aee3425070=1534762050',
    }
    res_m = requests.get(url=url_m4a, headers=headers)
    filename = url_m4a.split('/')[-1]
    if not os.path.exists('download'):
        os.mkdir('download')
    with open('download/' + filename, 'wb') as f:
        f.write(res_m.content)


if __name__ == '__main__':
    from multiprocessing import Queue
    from multiprocessing import Pool
    import multiprocessing
    queue = Queue()
    p = multiprocessing.Process(target=geturllist, args=(queue,))
    p.start()

    download_pool = Pool(5)
    for i in range(0, 10):
        print(i)
        url_m4a = queue.get()
        download_pool.apply_async(download_r, (url_m4a,))

    download_pool.close()
    download_pool.join()
    p.join()

你可能感兴趣的:(利用队列及多进程下载音频文件)