[root@yyjk /tmp]#cat fh2.html
<div><a target="aaa">科比</a></div>
<div><a target="bbb">乔丹</a></div>
<div><a target="aaa">乔治</a></div>
<a target="aaa">艾弗森</a>
[root@yyjk /tmp]#python a2.py
{'Connection': 'keep-alive', 'Accept-Encoding': 'gzip, deflate', 'Accept': '*/*', 'User-Agent': 'python-requests/2.18.4'}
<type 'unicode'>
科比
乔治
[root@yyjk /tmp]#vim a2.py ^C
[root@yyjk /tmp]#cat a2.py
#!/usr/bin/env python
# -*- coding: utf-8 -*-
import urllib2
import urllib
import cookielib
import json
import httplib
import re
import requests
import StringIO
import time
from lxml import etree
s = requests.sessi
根据 target 属性爬取 <a> 标签的文本
最新推荐文章于 2024-07-24 02:04:40 发布