# -*- coding=utf-8 -*-
import os
import re
import sys
from twisted.internet import protocol, reactor
file_url = """GET /sw-search-sp/soft/3a/12350/QQ_8.2.17724.0_setup.1459155849.exe HTTP/1.1
Host: dlsw.baidu.com
Connection: keep-alive
Accept: text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8
Accept-Encoding: gzip, deflate, sdch
Accept-Language: zh-CN,zh;q=0.8
Upgrade-Insecure-Requests: 1
User-Agent: Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.97 Safari/537.36
"""
class client_demo(protocol.Protocol):
file_handle = None
total_size = 0
received_size = 0
rep_header = None
SAVE_FILE_HEADER = "E:\\python\\twisted\\header.txt"
SAVE_FILE_NAME = "E:\\python\\twisted\\file.exe"
def connectionMade(self):
print("connectionMade")
print("remote client: {}:{}".format(self.transport.getPeer().host, self.transport.getPeer().port))
if os.path.exists(self.SAVE_FILE_HEADER):
os.remove(self.SAVE_FILE_HEADER)
if os.path.exists(self.SAVE_FILE_NAME):
os.remove(self.SAVE_FILE_NAME)
self.transport.write(file_url)
def connectionLost(self, reason):
print("connectionLost")
print("remote client: {}:{}".format(self.transport.getPeer().host, self.transport.getPeer().port))
print("reason: {}".format(reason))
if self.file_handle:
self.file_handle.close()
print("total received size: {}".format(self.received_size))
def dataReceived(self, data):
try:
hdr_end_pos = data.find("\r\n\r\n")
#get response header
if not self.rep_header:
self.rep_header = data[:hdr_end_pos]
print(self.rep_header)
self.total_size = re.findall("Content-Length:\s(\d+)\r\n", self.rep_header, re.IGNORECASE)[0]
#get response first packet of data
if not self.file_handle:
self.file_handle = open(self.SAVE_FILE_NAME, "wb")
file_data = data[hdr_end_pos + 4:]
else:
file_data = data
self.received_size += len(file_data)
sys.stdout.write("dataReceived: {} bytes, {}/{} bytes\r".format(len(data), self.received_size, self.total_size))
sys.stdout.flush()
self.file_handle.write(file_data)
except Exception as e:
print("Error: {}".format(e))
class client_factory(protocol.ClientFactory):
protocol = client_demo
def clientConnectionFailed(self, connector, reason):
print("clientConnectionFailed")
reactor.stop()
def clientConnectionLost(self, connector, reason):
print("clientConnectionLost")
reactor.stop()
def main():
c = client_factory()
reactor.connectTCP("dlsw.baidu.com", 80, c)
reactor.run()
if __name__ == "__main__":
main()
基于Twisted的通过HTTP协议下载文件
最新推荐文章于 2024-05-10 09:42:08 发布