标签:odi www. encoding port 解析 from 异常 urllib retrieve
# coding=utf-8
"""Fetch one web page, extract its title and first image, and save the image.

The script downloads the page at ``url``, pulls the heading text and the
image ``src`` out of the HTML with fixed XPath expressions, and stores the
image as ``/craw/<title>.jpg``.  Any failure is reported on stdout instead
of propagating.
"""
# Importing the submodule explicitly is required: a bare ``import urllib``
# does not guarantee that ``urllib.request`` is loaded.
import urllib.request

import requests
from lxml import etree

url = 'http://www.7160.com/zhenrenxiu/56786/'


def parse_content(content):
    """Extract the page title and the image URL from an HTML document.

    Args:
        content: The HTML text of the page.

    Returns:
        A ``(title, img_url)`` tuple holding the first match of each XPath.

    Raises:
        IndexError: If either XPath expression matches nothing.
    """
    tree = etree.HTML(content)
    title = tree.xpath("/html/body/div/div[2]/div[1]/div[2]/h1/text()")
    # Named ``img_urls`` so the module-level ``url`` is not shadowed.
    img_urls = tree.xpath(
        "/html/body/div/div[2]/div[1]/div[2]/div[3]/p/a/img/@src"
    )
    print(title)
    print(img_urls[0])
    return (title[0], img_urls[0])


def store_img(title, img_url):
    """Download ``img_url`` and save it as ``/craw/<title>.jpg``.

    Args:
        title: Used verbatim as the file name (without extension).
        img_url: Address of the image to download.
    """
    # NOTE(review): the /craw/ directory is not created here; the download
    # presumably fails if it does not exist - confirm on the target machine.
    target = '/craw/' + title + ".jpg"
    urllib.request.urlretrieve(img_url, target)
    print(target + " 保存成功")


try:
    # A timeout keeps the script from hanging forever on an unresponsive
    # server; a timeout error is reported by the handler below.
    res = requests.get(url, timeout=10)
    res.encoding = 'gb2312'
    # Parse the page; returns the title and the image URL.
    title, img_url = parse_content(res.text)
    store_img(title, img_url)
except Exception as e:
    # Top-level boundary of the script: report the failure and exit normally.
    print("异常" + str(e))
标签:odi www. encoding port 解析 from 异常 urllib retrieve
原文地址:https://www.cnblogs.com/php-linux/p/9678099.html