xpath 爬取图片

时间:2025-05-12 08:22:50
import os
import re
from urllib.parse import urljoin

import requests
from lxml import etree
from urllib3 import request  # not used below; kept from the original import list

# NOTE(review): this script was recovered from a copy in which all statements
# were collapsed onto one line and the dotted call targets were missing
# (only the parenthesised arguments survived).  The calls restored below --
# re.sub, requests.get, etree.HTML, .xpath, .append, .content, .write -- are
# inferred from the imports and from the argument shapes; confirm them against
# the original script.

# Matches the page segment of a listing URL, e.g. "/page/3".
_PAGE_SEGMENT = re.compile(r'/page/\d+')


# Pagination
def page(url, totalpage):
    """Build the list of listing URLs for pages 1..totalpage.

    Args:
        url: A URL containing a ``/page/<digits>`` segment.
        totalpage: Number of pages to generate (inclusive upper bound).

    Returns:
        A list of ``totalpage`` strings in which every ``/page/<digits>``
        segment of ``url`` is replaced by ``/page/<n>``.  If ``url`` has no
        such segment, each entry is ``url`` unchanged.
    """
    return [
        _PAGE_SEGMENT.sub('/page/%s' % i, url)
        for i in range(1, totalpage + 1)
    ]


# NOTE(review): the host part of this URL is missing in the recovered copy;
# fill in the target site before running, otherwise the request below fails.
url = 'http:///'
text = requests.get(url).text
html = etree.HTML(text)

# <span> nodes below <div class="content">
r2 = html.xpath('//div[@class="content"]//span')
# title attribute of links below <div class="author clearfix">
r1 = html.xpath('//div[@class="author clearfix"]//a/@title')
# src attribute of every <img> in the page
r3 = html.xpath('//img/@src')


def put(r1, r2):
    """Collect the items of ``r1``, each followed by the first item of ``r2``.

    NOTE(review): the loop nesting could not be recovered with certainty;
    this layout (inner loop inside the outer one, stopping after its first
    item) is the reading assumed here -- confirm against the original.

    Args:
        r1: Iterable of values appended in order.
        r2: Iterable whose first item (if any) is appended after each
            ``r1`` value.

    Returns:
        The combined list.  The recovered code built this list but never
        returned it; it is returned here so the function has a usable result.
    """
    output = []
    for name in r1:
        output.append(name)
        for each in r2:
            output.append(each)
            break  # only the first r2 item is taken
    return output


# Download every image except the first one into output/<index>.jpg.
os.makedirs('output', exist_ok=True)  # open() below fails if the folder is missing
del r3[:1]  # drop the first match; slice form does not raise on an empty list
for i, every in enumerate(r3):
    # Resolve relative or protocol-relative src values against the page URL;
    # absolute URLs pass through unchanged.
    pic = requests.get(urljoin(url, every)).content
    string = 'output/' + str(i) + '.jpg'
    with open(string, 'wb') as fg:
        fg.write(pic)