# 请求库:requests
# 解析库:lxml
# 目的:爬取某位CSDN博主的文章标题
import requests
from lxml import etree
# Address of the article-list page that will be requested.
# NOTE(review): the host is a siteproxy mirror wrapping the CSDN blog URL, and
# the trailing "1" is presumably the page number -- confirm both are intended.
url = "https://yetingyun.blog.csdn.net/article/list/1"

# HTTP request headers: a desktop Chrome User-Agent string. The adjacent
# literals are joined at compile time into one unbroken header value.
headers = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36 (KHTML, like Gecko) "
        "Chrome/87.0.4280.88 Safari/537.36"
    ),
}
req = requests.get(url, headers=headers