import re
import sys
import time

import requests
from bs4 import BeautifulSoup
# Script-wide settings and state shared with danz() and the driver loop below.

# Start timestamp for the elapsed-time report.  time.clock() was removed in
# Python 3.8; prefer it only where it still exists so that every reader of
# ``s`` in this file measures on the same clock, otherwise use perf_counter().
s = getattr(time, "clock", time.perf_counter)()

# Running number of the next image to save; doubles as the file name and is
# incremented by danz() after each download.
pp = 1

# When False the crawl stops as soon as image number ``end`` has been saved.
# NOTE: this shadows the builtin all(); the name is kept because danz() reads it.
all = False

# Image number at which the crawl stops (only honoured while ``all`` is False).
end = 30

# Output directory prefix; file names are built as "<path><pp>.jpg", so the
# trailing separator is required.
path = 'C:\\Users\\win10\\Desktop\\python\\爬取桌面壁纸图\\壁纸\\'
def danz(id, timeout=10):
    """Download every picture of one wallpaper gallery.

    Requests ``wallpaper_detail_<id>_<page>.html`` for page 1, 2, ... and, for
    each page, saves the ``<img class="pic-large">`` picture as
    ``<path><pp>.jpg`` before advancing the module-level counter ``pp``.
    The walk ends at the first page that is not answered with HTTP 200 or
    that contains no such image.

    While the module-level flag ``all`` is false, the whole program is
    terminated as soon as image number ``end`` has been written.

    Args:
        id: Gallery identifier as it appears in the detail-page URL.
        timeout: Seconds to wait for each HTTP request before giving up.

    Raises:
        SystemExit: When the ``end`` limit is reached; the exit message
            carries the elapsed time.
        requests.RequestException: Network errors and timeouts are not
            handled here and propagate to the caller.
    """
    global pp

    # time.clock() was removed in Python 3.8; use it only where it still
    # exists so the reading is comparable with the start timestamp ``s``.
    clock = getattr(time, "clock", time.perf_counter)

    page = 1
    while True:
        html = requests.get(
            "http://www.win4000.com/wallpaper_detail_%s_%s.html" % (id, page),
            timeout=timeout,
        )
        # Past the last page (404) or any other failure: nothing left to parse.
        if html.status_code != 200:
            break

        img = BeautifulSoup(html.text, 'lxml').find('img', class_='pic-large')
        # find() returns None when the page has no large picture; subscripting
        # that would raise TypeError, so treat it as the end of the gallery.
        if img is None or not img.get('src'):
            break

        picture = requests.get(img['src'], timeout=timeout)
        if picture.status_code != 200:
            # Do not store an error body as a .jpg; try the next page and
            # leave the image counter untouched.
            page += 1
            continue

        with open("%s%s.jpg" % (path, pp), 'wb') as f:
            f.write(picture.content)
        print("第%s张图片下载完成" % pp)

        if not all and int(pp) == end:
            # sys.exit() instead of the site-provided exit(), which is not
            # guaranteed to exist (e.g. under ``python -S``).
            sys.exit("完成耗时%s秒" % (clock() - s))

        page += 1
        pp += 1
def m(url, timeout=10):
    """Download all wallpaper galleries linked from one listing page.

    Fetches ``url``, collects the gallery ids from every
    ``wallpaper_detail_<id>.html`` link in the response text and hands each
    distinct id to ``danz`` in order of first appearance.

    Args:
        url: Address of the listing page to scan.
        timeout: Seconds to wait for the listing page before giving up.

    Raises:
        requests.RequestException: Network errors and timeouts propagate.
    """
    html = requests.get(url, timeout=timeout)
    if html.status_code != 200:
        return

    # Dots are escaped so they match literally.  The id group excludes "_" so
    # that page-suffixed links (wallpaper_detail_<id>_<page>.html, the form
    # danz() builds itself) are not mistaken for gallery ids.
    ids = re.findall(
        r'http://www\.win4000\.com/wallpaper_detail_([0-9A-Za-z]+)\.html',
        html.text,
    )

    # A gallery linked more than once on the page is downloaded only once.
    seen = set()
    for gallery_id in ids:
        if gallery_id in seen:
            continue
        seen.add(gallery_id)
        danz(gallery_id)
# Crawl listing pages 1-5 of the "dongman" topic, then report the elapsed time.
# The loop variable is the page number itself; no separate counter is needed.
for page in range(1, 6):
    m("http://www.win4000.com/zt/dongman_%s.html" % page)

# time.clock() was removed in Python 3.8; use it only where it still exists so
# the reading is comparable with the start timestamp ``s``.
e = getattr(time, "clock", time.perf_counter)()
print("完成耗时%s秒" % (e - s))