import urllib.request
import json
import codecs
class info(object):
    """Fetch a JSON movie listing and append it to a SQL script as INSERTs.

    The response body is expected to be a UTF-8 encoded JSON object whose
    ``"data"`` key holds a list of objects with ``"title"`` and ``"rate"``
    keys. One ``insert into tencent(title,rate)`` statement is generated per
    list element.
    """

    # Endpoint used when the caller does not supply a URL.
    # NOTE(review): the "" segment in front of the
    # movie.douban.com address looks like a link-rewriting artifact -- confirm
    # the intended endpoint before relying on this default.
    DEFAULT_URL = (
        "https://movie.douban.com/j/new_search_subjects"
        "?sort=T&range=0,10&tags=%E7%94%B5%E5%BD%B1&start=9960"
    )

    @classmethod
    def moviedown(cls, url=None, output_path="tencent.sql"):
        """Download the listing at *url* and append INSERT statements to a file.

        Args:
            url: Address to fetch. Anything that is not a string (including
                the default ``None``) selects ``DEFAULT_URL``, so existing
                calls such as ``info().moviedown()`` keep working.
            output_path: File that receives the generated SQL. It is opened
                in append mode and written as UTF-8.

        Returns:
            None. The rating of the first entry (when there is one) and the
            word ``success`` are printed to standard output.

        Raises:
            urllib.error.URLError: If the URL cannot be opened.
            json.JSONDecodeError: If the response body is not valid JSON.
            KeyError: If ``"data"``, ``"title"`` or ``"rate"`` is missing.
        """
        if not isinstance(url, str):
            url = cls.DEFAULT_URL

        # Fetch and decode the response; the context manager closes the
        # connection even when reading or parsing fails.
        request = urllib.request.Request(url)
        with urllib.request.urlopen(request) as response:
            payload = json.loads(response.read().decode("utf-8"))

        # payload["data"] is a list; each element is a dict describing a movie.
        movies = payload["data"]
        if movies:
            # An empty result list used to raise IndexError here.
            print(movies[0]["rate"])

        chunks = ["\r\n"]
        chunks.extend(
            cls._insert_statement(movie["title"], movie["rate"])
            for movie in movies
        )

        # newline="" stops the text layer from rewriting the explicit "\r\n"
        # line endings that are part of the generated script.
        with open(output_path, "a", encoding="utf-8", newline="") as sql_file:
            sql_file.write("".join(chunks))
        print("success")

    @classmethod
    def _insert_statement(cls, title, rate):
        """Return one INSERT statement (terminated by CRLF) for a movie."""
        return "insert into tencent(title,rate) values (%s,%s);\r\n" % (
            cls._sql_literal(title),
            cls._sql_literal(rate),
        )

    @staticmethod
    def _sql_literal(value):
        """Return *value* as a single-quoted SQL string literal.

        Embedded single quotes are doubled so a title such as ``It's`` does
        not terminate the literal early.
        """
        return "'%s'" % str(value).replace("'", "''")
# Run the scraper once. The original second line was cut off at ``test.m``,
# which raises AttributeError; ``moviedown`` is the only method ``info``
# defines, so the call is restored here.
test = info()
test.moviedown()
Python 爬虫抓取豆瓣电影，并存入数据库
最新推荐文章于 2025-06-05 17:29:45 发布