Python爬虫——爬取美食网菜谱(数据库版)

Python爬虫——爬取美食网菜谱(数据库版)

import requests
import pymysql
from bs4 import BeautifulSoup
#---------------------------爬取目标网页-----------
def pa():
    indexs = 0
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/77.0.3865.90 Safari/537.36'
    }
    # 建立连接
    conn = pymysql.connect(host='localhost', user='root', password='root',db='spiderdb', port=3306, charset='utf8')
    # 建立游标
    cursor = conn.cursor()
    # 数据库操作
    # (1)定义一个格式化的sql语句
    sql = 'insert into foods(id,foodname,picsrc,url,foodmaterial,foodstep,fooddoor) values(%s,%s,%s,%s,%s,%s,%s) '

    for page in range(10,95888):#(95888-10)道菜
        url = f'https://home.meishichina.com/recipe-{page}.html'
        response = requests.get(url=url, hea

你可能感兴趣的:(Python,python,数据库)