2020-04-21 09:15发布
import requests
from lxml import etree


def getHTMLtext(url):
    """Fetch a page and return the text found in its table cells.

    The page at ``url`` is downloaded with a 30-second timeout, its body is
    decoded as GB2312, the markup is parsed as HTML, and the result of the
    XPath query ``//tr/td/text()`` is returned.
    """
    res = requests.get(url, timeout=30)
    # Override the response encoding to work around garbled Chinese text.
    res.encoding = 'gb2312'
    # Parse the decoded markup into an element tree.
    html = etree.HTML(res.text)
    # Use XPath to pull the text nodes of every <td> that sits under a <tr>.
    HTMLtext = html.xpath("//tr/td/text()")
    return HTMLtext
最多设置5个标签!
import requests
from lxml import etree


def getHTMLtext(url, encoding='gb2312', timeout=30):
    """Download ``url`` and return the text nodes of its table cells.

    Args:
        url: Address of the page to fetch.
        encoding: Codec assigned to the response before its text is read.
            Defaults to ``'gb2312'``, the value that used to be hard-coded.
        timeout: Value forwarded to ``requests.get`` as ``timeout``.
            Defaults to 30, the value that used to be hard-coded.

    Returns:
        Whatever the XPath query ``//tr/td/text()`` yields for the parsed
        page.
    """
    response = requests.get(url, timeout=timeout)
    # Set the encoding explicitly so Chinese text decodes correctly.
    response.encoding = encoding
    # Turn the decoded markup into an element tree that supports XPath.
    document = etree.HTML(response.text)
    # Text nodes of every <td> located under a <tr>.
    return document.xpath("//tr/td/text()")
一周热门 更多>