由于内容简单，此处只做代码分享。
需求数据如图：
最终效果：
完整代码：
# https://ty.fang.lianjia.com/loupan/
import requests
from lxml import etree
import pymysql
class LJSpider():
def __init__(self):
self.num=int(input('页数:'))
self.url='https://ty.fang.lianjia.com/loupan/pg%d/'
self.headers={'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36 Edg/98.0.1108.62',}
self.connect = pymysql.connect(host='127.0.0.1', user='root', password=' ', database='rxkc', charset='utf8')
self.cursor = self.connect.cursor()
l = 'drop table if exists lianjia;'
self.cursor.execute(l)