标签:headers als retrieve out hand lib 创建 form data default
import urllib.request

# Example 1: fetch a web page and print it as text.
# urlopen() returns an HTTP response object; using it as a context manager
# guarantees the underlying connection is closed once the body has been read.
with urllib.request.urlopen("http://www.fishc.com") as response:
    html = response.read()  # the response body is returned as bytes

# At this point type(html) is <class 'bytes'>; decode it to get a str.
html = html.decode('utf-8')
print(html)
import urllib.request

# Example 2: download an image and save it to disk.
# The body is kept as raw bytes because it is binary image data.
with urllib.request.urlopen("http://placekitten.com/g/400/400") as response:
    cat_img = response.read()

# 'wb' writes the bytes unchanged, with no text encoding applied.
with open('cat_400_400.jpg', 'wb') as f:
    f.write(cat_img)


import json
import time
import urllib.parse
import urllib.request

# Example 3: submit a form with POST to a translation endpoint and print the
# translated text, looping until the user enters "q!".

# The "Request URL" of the translation request; it never changes, so it is
# defined once instead of on every loop iteration.
url = "http://fanyi.youdao.com/translate?smartresult=dict&smartresult=rule&smartresult=ugc&sessionFrom=http://www.youdao.com/"

while True:
    content = input("请输入需要翻译的内容《输入q!退出程序》:")
    if content == 'q!':
        break

    # The request's "Form Data" fields, with unneeded entries removed.
    data = {
        'i': content,
        'smartresult': 'dict',
        'client': 'fanyideskweb',
        'doctype': 'json',
        'version': '2.1',
        'keyfrom': 'fanyi.web',
        'action': 'FY_BY_CLICKBUTTON',
        'typoResult': 'true',
    }
    # urlopen() needs the form as URL-encoded bytes; passing a data argument
    # makes the request a POST.
    data = urllib.parse.urlencode(data).encode('utf-8')

    # Open the URL and submit the form; the response is closed on exit.
    with urllib.request.urlopen(url, data) as response:
        html = response.read().decode('utf-8')

    target = json.loads(html)
    print("翻译结果:%s" % (target['translateResult'][0][0]['tgt']))

    # Pause between requests so the service is not queried too rapidly.
    time.sleep(2)
import random
import urllib.request

# Example 4: send a request through a randomly chosen HTTP proxy with a
# custom User-Agent header, then print the page that was returned.
url = 'http://www.whatismyip.com.tw/'
iplist = [
    '61.191.41.130:80',
    '115.46.97.122:8123',
]

# ProxyHandler takes a dict of the form {'scheme': 'proxy_ip:port'}.
proxy_support = urllib.request.ProxyHandler({'http': random.choice(iplist)})

# Build a customised opener that routes requests through the proxy.
opener = urllib.request.build_opener(proxy_support)

# Override the User-Agent header via the opener's addheaders list.
opener.addheaders = [
    (
        'User-Agent',
        'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36',
    ),
]

# Install the opener globally so that plain urlopen() calls use it.
urllib.request.install_opener(opener)

with urllib.request.urlopen(url) as response:
    html = response.read().decode('utf-8')
print(html)
import re
import urllib.request


def open_url(url):
    """Fetch *url* with a browser-like User-Agent and return the page text.

    Args:
        url: Address of the page to download.

    Returns:
        The response body decoded as UTF-8.
    """
    req = urllib.request.Request(url)
    # Set the User-Agent on this single request via add_header.
    req.add_header(
        'User-Agent',
        'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36',
    )
    # The context manager closes the connection once the body has been read.
    with urllib.request.urlopen(req) as page:
        return page.read().decode('utf-8')


def get_img(html):
    """Download every ``BDE_Image`` .jpg referenced in *html*.

    Each image is saved in the current working directory under the last path
    segment of its URL. Nothing is downloaded when *html* has no matches.

    Args:
        html: Page source to scan for image tags.
    """
    p = r'<img class="BDE_Image" src="([^"]+\.jpg)'
    # findall returns only the captured group, i.e. the image URLs.
    for each in re.findall(p, html):
        filename = each.split("/")[-1]
        urllib.request.urlretrieve(each, filename, None)  # save the image


if __name__ == '__main__':
    url = "https://tieba.baidu.com/p/5090206152"
    get_img(open_url(url))
标签:headers als retrieve out hand lib 创建 form data default
原文地址:http://www.cnblogs.com/tcheng/p/6886351.html