import
requests
from
lxml
import
etree
import
os
# Download every picture linked from one nipic.com listing page.
#
# Flow: fetch the listing page, collect the detail-page links from the search
# result list, then for each detail page read the `src` of the element with
# id "J_worksImg" and save that file under `root`, named after the last path
# segment of the image URL. Files already on disk are skipped.

# Seconds to wait on any single HTTP request; without a timeout a stalled
# connection would hang the script forever.
REQUEST_TIMEOUT = 10

url1 = "http://www.nipic.com/photo/shengwu/yulei/index.html"
response1 = requests.get(url1, timeout=REQUEST_TIMEOUT)
# Fail loudly if the listing page itself cannot be fetched, rather than
# parsing an error page and silently finding zero links.
response1.raise_for_status()
data1 = response1.text
s1 = etree.HTML(data1)
pics_href = s1.xpath(
    "/html/body/div[@class='new-layout-width mbt-area clearfix layout-width']/div[@class='fl new-search-main']/div[@class='new-search-result overflow-hidden']/ul/li/a/@href"
)

# Destination directory (loop-invariant, so defined once up front).
root = "f://Pyspider//pics//"

# Running count of pictures actually saved in this run (1-based).
i = 1
for pic_href in pics_href:
    try:
        url2 = pic_href
        response2 = requests.get(url2, timeout=REQUEST_TIMEOUT)
        response2.raise_for_status()
        data2 = response2.text
        s2 = etree.HTML(data2)
        pic_list = s2.xpath("//*[@id='J_worksImg']/@src")
        # Raises IndexError when the page has no such element; handled below
        # so one bad page does not abort the whole run.
        pic_url = pic_list[0]
        path = root + pic_url.split('/')[-1]

        # makedirs (not mkdir) so missing parent directories are created too;
        # exist_ok avoids the check-then-create race.
        os.makedirs(root, exist_ok=True)

        if not os.path.exists(path):
            r = requests.get(pic_url, timeout=REQUEST_TIMEOUT)
            # Do not write an HTTP error body to disk as if it were an image.
            r.raise_for_status()
            with open(path, 'wb') as f:
                f.write(r.content)
            print('第{}张图片保存成功'.format(i))
            i += 1
        else:
            print('此图片已存在')
    except Exception as exc:
        # Best-effort per picture: report and move on. `Exception` (rather
        # than a bare except) lets KeyboardInterrupt/SystemExit stop the
        # script, and the detail is printed so failures can be diagnosed.
        print('图片地址异常', exc)