tornado+gunicorn部署设置max_body_size

背景

想通过 gunicornmax_requests 配置实现重启进程,解决一些内存泄露问题。

因为gunicorn启动配置的是 tornado.web.Application 实例,并非直接使用 tornado.httpserver.HTTPServer 导致无法设置 max_body_sizemax_buffer_size

gunicore配置项 中只有 limit_request_line /limit_request_fields / limit_request_field_size 无法满足 tornado的限制配置。

现状

依赖版本如下:

  • Python3.9
  • tornado==6.5.2
  • gunicorn==23.0.0

app.py

# 定义实例
app = tornado.web.Application(url_patterns)

gunicorn.conf.py

# 因为用的docker部署有restart配置
daemon = False
# 不能设置为True, tornado的IOLoop不能被共享
preload_app = False
# 可以有效解决OOM的问题
max_requests = 102400
max_requests_jitter = 1024
# 连接的空闲时间(秒),对应 idle_connection_timeout=60
keepalive = 60
# 对应 body_timeout/请求处理超时
timeout = 60
# bind
# port = os.environ.get("PROJECT_PORT", 8000)
# bind = "0.0.0.0:{}".format(port)
worker_class = "tornado"

启动命令

gunicorn -c gunicorn.conf.py --bind 0.0.0.0:8000 --workers 2 app:app

自定义 TornadoWorker

解决方式可以通过自定义 TornadoWorker . 代码是基于 gunicorn 源码修改的,主要修改 server_class 初始化的部分,增加了 max_body_size 相关配置。

最终的是同步修改 gunicore 启动 worker_class 配置:

worker_class = "gunicorn_worker.MyTornadoWorker"

gunicorn_worker 代码实现如下:

#!/usr/bin/env python
# coding=utf-8
import typing

from gunicorn.sock import ssl_context
from gunicorn.workers.gtornado import TornadoWorker

import tornado
from tornado.wsgi import WSGIContainer
from tornado.ioloop import IOLoop, PeriodicCallback

MAX_FILE_SIZE = 100 * 1024 * 1024  # 100MB

class MyTornadoWorker(TornadoWorker):
    """专门为tornado>=6定制
    因为需要实现设置 max_body_size
    """

    def run(self) -> None:
        self.ioloop = IOLoop.instance()
        self.alive = True
        self.server_alive = False

        # tornado >= 5
        self.callbacks = []
        self.callbacks.append(PeriodicCallback(self.watchdog, 1000))
        self.callbacks.append(PeriodicCallback(self.heartbeat, 1000))
        for callback in self.callbacks:
            callback.start()
        # Assume the app is a WSGI callable if its not an
        # instance of tornado.web.Application or is an
        # instance of tornado.wsgi.WSGIApplication
        app = self.wsgi

        if not isinstance(app, WSGIContainer) and not isinstance(app, tornado.web.Application):
            app = WSGIContainer(app)

        # Monkey-patching HTTPConnection.finish to count the
        # number of requests being handled by Tornado. This
        # will help gunicorn shutdown the worker if max_requests
        # is exceeded.
        httpserver = tornado.httpserver.HTTPServer
        if hasattr(httpserver, "HTTPConnection"):
            old_connection_finish = httpserver.HTTPConnection.finish

            def finish(other: typing.Any) -> None:
                self.handle_request()
                old_connection_finish(other)

            httpserver.HTTPConnection.finish = finish

            server_class = httpserver
        else:

            class _HTTPServer(tornado.httpserver.HTTPServer):
                def on_close(instance: typing.Any, server_conn: typing.Any) -> None:
                    self.handle_request()
                    super().on_close(server_conn)

            server_class = _HTTPServer

        if self.cfg.is_ssl:
            server = server_class(
                app,
                ssl_options=ssl_context(self.cfg),
                max_body_size=MAX_FILE_SIZE,
                max_buffer_size=MAX_FILE_SIZE,
            )
        else:
            server = server_class(
                app,
                max_body_size=MAX_FILE_SIZE,
                max_buffer_size=MAX_FILE_SIZE,
            )

        self.server = server
        self.server_alive = True

        for s in self.sockets:
            s.setblocking(0)
            if hasattr(server, "add_socket"):  # tornado > 2.0
                server.add_socket(s)
            elif hasattr(server, "_sockets"):  # tornado 2.0
                server._sockets[s.fileno()] = s

        server.no_keep_alive = self.cfg.keepalive <= 0
        server.start(num_processes=1)
        self.ioloop.start()

我给你我的代码,你在我代码上去优化吧,server: import tornado.ioloop import tornado.web import threading import time import os import logging import asyncio from concurrent.futures import ThreadPoolExecutor from handlers import MainHandler, WSHandler, UpdatePoolHandler, FileListHandler, FileDownloadHandler, FilePreviewHandler, ManualScanHandler from file_utils import scan_pools # 配置日志 logging.basicConfig( level=logging.INFO, format='%(asctime)s - %(name)s - %(levelname)s - %(message)s' ) logger = logging.getLogger("ResourceManager") # 自定义线程池(用于异步执行资源池扫描等阻塞操作) executor = ThreadPoolExecutor(4) # 根据 CPU 核心数调整线程池大小 # 设置 asyncio 默认事件循环的执行器为线程池 asyncio.get_event_loop().set_default_executor(executor) # 修复模板路径和路由配置 def make_app(): base_dir = os.path.dirname(os.path.abspath(__file__)) template_path = os.path.join(base_dir, "templates") static_path = os.path.join(base_dir, "static") return tornado.web.Application( [ (r"/", MainHandler), (r"/ws", WSHandler), (r"/update_pool", UpdatePoolHandler), (r"/files/(.+)", FileListHandler), (r"/download", FileDownloadHandler), (r"/preview", FilePreviewHandler), (r"/scan", ManualScanHandler), (r"/static/(.*)", tornado.web.StaticFileHandler, {"path": static_path}), (r"/admin", MainHandler), ], template_path=template_path, cookie_secret="YOUR_SECRET_KEY", login_url="/login", debug=False, # 生产环境建议关闭 debug max_buffer_size=1024 * 1024 * 1024, # 最大缓冲区大小(1GB) chunked_write_timeout=60000, # 分块写入超时时间(毫秒) idle_connection_timeout=60000, # 空闲连接超时时间 executor=executor # 使用自定义线程池 ) if __name__ == "__main__": try: # 初始化资源池扫描 scan_pools() logger.info("资源池扫描初始化完成") except Exception as e: logger.error(f"资源池扫描初始化失败: {str(e)}") # 创建并启动应用 app = make_app() app.listen(8888) logger.info("服务器运行中: http://localhost:8888") try: # 启动事件循环 tornado.ioloop.IOLoop.current().start() except KeyboardInterrupt: logger.info("\n服务器正在关闭...") except Exception as e: logger.error(f"服务器异常停止: {str(e)}") finally: # 清理资源(可选) executor.shutdown(wait=True) #预览视频下载和下载按钮下载速度大幅度提升,txt文本实现在线预览,word等文档预览会下载而不是显示不支持预览,本地速度快,跨设备比较慢 handlers: import tornado.web import tornado.websocket import json import os import mimetypes import urllib.parse from config import RESOURCE_POOLS, save_config, ADMIN_IP, ADMIN_PASSWORD from file_utils import get_file_list, scan_pools import aiofiles # 改进管理员检查 def is_admin(handler): """检查当前用户是否有管理员权限""" client_ip = handler.request.remote_ip # 支持IPv4和IPv6的本地地址 return client_ip in ["127.0.0.1", "::1", "localhost"] or \ client_ip == ADMIN_IP or \ handler.get_cookie("admin_auth") == ADMIN_PASSWORD # handlers.py # 手动资源扫描接口 class ManualScanHandler(tornado.web.RequestHandler): async def get(self): if not is_admin(self): self.set_status(403) self.write("权限不足") return # 使用线程池异步执行 scan_pools await tornado.ioloop.IOLoop.current().run_in_executor(executor, scan_pools) WSHandler.broadcast_update() # 通知前端更新 self.write("资源池已手动扫描完成") # 主页面处理器 class MainHandler(tornado.web.RequestHandler): def get(self): try: if self.request.path == "/admin": if not is_admin(self): self.redirect("/") return self.render("admin.html", pools=RESOURCE_POOLS) else: if is_admin(self): self.render("admin.html", pools=RESOURCE_POOLS) else: self.render("user.html", pools=RESOURCE_POOLS) except FileNotFoundError: self.set_status(404) self.render("404.html") except Exception as e: self.set_status(500) self.render("500.html", error=str(e)) # WebSocket实时更新处理器 class WSHandler(tornado.websocket.WebSocketHandler): clients = set() def open(self): self.clients.add(self) self.send_update() def on_message(self, message): # 处理客户端消息 pass def on_close(self): self.clients.remove(self) def send_update(self): """发送更新到所有连接的客户端""" for client in self.clients: client.write_message(json.dumps(RESOURCE_POOLS)) @classmethod def broadcast_update(cls): """广播更新到所有客户端""" for client in cls.clients: client.write_message(json.dumps(RESOURCE_POOLS)) # 资源池更新处理器(仅管理员) class UpdatePoolHandler(tornado.web.RequestHandler): def post(self): if not is_admin(self): self.write({"status": "error", "message": "无权限执行此操作"}) return data = json.loads(self.request.body) pool_name = data.get("pool") new_path = data.get("path") if pool_name and new_path and pool_name in RESOURCE_POOLS: # 验证路径有效性 if not os.path.exists(new_path) or not os.path.isdir(new_path): self.write({"status": "error", "message": "路径不存在或不是目录"}) return # 更新路径并扫描文件 RESOURCE_POOLS[pool_name]["path"] = new_path try: RESOURCE_POOLS[pool_name]["files"] = [ f for f in os.listdir(new_path) if os.path.isfile(os.path.join(new_path, f)) ] except Exception as e: RESOURCE_POOLS[pool_name]["files"] = [f"错误: {str(e)}"] # 保存配置并广播更新 save_config() WSHandler.broadcast_update() self.write({"status": "success"}) else: self.write({"status": "error", "message": "无效资源池或路径"}) # 文件列表处理器 class FileListHandler(tornado.web.RequestHandler): async def get(self, pool_name): if pool_name not in RESOURCE_POOLS: self.set_status(404) self.render("404.html") return # 获取文件列表数据 files = get_file_list(pool_name) # 渲染模板 self.render("file_list.html", pool_name=pool_name, files=files, pool_info=RESOURCE_POOLS[pool_name], is_admin=is_admin(self)) # handlers.py # 文件下载处理器 class FileDownloadHandler(tornado.web.RequestHandler): async def get(self): pool_name = self.get_argument("pool") file_name = self.get_argument("file") if pool_name not in RESOURCE_POOLS: self.set_status(404) self.render("404.html") return pool_path = RESOURCE_POOLS[pool_name]["path"] file_path = os.path.join(pool_path, file_name) # 防止路径遍历攻击 real_path = os.path.realpath(file_path) if not real_path.startswith(os.path.realpath(pool_path)): self.set_status(403) self.write("禁止访问此文件路径") return if not os.path.exists(file_path): self.set_status(404) self.render("404.html") return file_size = os.path.getsize(file_path) range_header = self.request.headers.get('Range') start = 0 end = file_size - 1 if range_header: self.set_status(206) # Partial Content start_bytes, end_bytes = range_header.replace('bytes=', '').split('-') start = int(start_bytes) if start_bytes else 0 end = int(end_bytes) if end_bytes else file_size - 1 self.set_header('Content-Range', f'bytes {start}-{end}/{file_size}') self.set_header("Content-Length", str(end - start + 1)) encoded_filename = urllib.parse.quote(file_name.encode('utf-8')) self.set_header("Content-Type", "application/octet-stream") self.set_header("Content-Disposition", f'attachment; filename*=UTF-8\'\'{encoded_filename}') self.set_header("Accept-Ranges", "bytes") chunk_size = 1024 * 1024 * 4 # 4MB try: async with aiofiles.open(file_path, 'rb') as f: await f.seek(start) remaining = end - start + 1 while remaining > 0: read_size = min(chunk_size, remaining) chunk = await f.read(read_size) if not chunk: break self.write(chunk) await self.flush() remaining -= len(chunk) self.finish() except tornado.iostream.StreamClosedError: # 客户端提前关闭连接,静默处理 return except Exception as e: self.set_status(500) self.write(f"Internal Server Error: {str(e)}") return class FilePreviewHandler(tornado.web.RequestHandler): async def get(self): pool_name = self.get_argument("pool") file_name = self.get_argument("file") if pool_name not in RESOURCE_POOLS: self.set_status(404) self.render("404.html") return pool_path = RESOURCE_POOLS[pool_name]["path"] file_path = os.path.join(pool_path, file_name) # 防止路径遍历攻击 real_path = os.path.realpath(file_path) if not real_path.startswith(os.path.realpath(pool_path)): self.set_status(403) self.write("禁止访问此文件路径") return if not os.path.exists(file_path): self.set_status(404) self.render("404.html") return # 获取扩展名 ext = os.path.splitext(file_name)[1].lower() # 手动定义 MIME 类型 mime_type = { '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document', '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet', '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation', '.pdf': 'application/pdf', '.txt': 'text/plain', '.md': 'text/markdown', '.html': 'text/html', '.css': 'text/css', '.js': 'application/javascript', '.png': 'image/png', '.jpg': 'image/jpeg', '.jpeg': 'image/jpeg', '.gif': 'image/gif', '.mp4': 'video/mp4', '.webm': 'video/webm', '.ogg': 'video/ogg', }.get(ext, mimetypes.guess_type(file_name)[0] or 'application/octet-stream') # 设置 UTF-8 编码的文件名 encoded_filename = urllib.parse.quote(file_name.encode('utf-8')) self.set_header("Content-Disposition", f'inline; filename*=UTF-8\'\'{encoded_filename}') file_size = os.path.getsize(file_path) # 区分是否是 Range 请求(预览)还是完整下载 range_header = self.request.headers.get('Range') is_download = not range_header and ext in ['.mp4', '.webm', '.ogg', '.pdf'] if is_download: # 完整下载,使用 sendfile()(Linux) 或同步读取 self.set_header('Content-Type', mime_type) self.set_header('Content-Length', str(file_size)) self.set_status(200) if os.name == 'posix': # Linux 下使用 sendfile 实现零拷贝传输 fd = os.open(file_path, os.O_RDONLY) try: await tornado.ioloop.IOLoop.current().run_in_executor( None, os.sendfile, self.request.connection.fileno(), fd, None, file_size ) finally: os.close(fd) else: # Windows 或其他系统,使用同步读取(比 aiofiles 更快) with open(file_path, 'rb') as f: while True: chunk = f.read(1024 * 1024 * 4) # 4MB if not chunk: break self.write(chunk) await self.flush() self.finish() elif ext in ['.mp4', '.webm', '.ogg', '.pdf']: # 视频预览,使用 aiofiles 支持 Range self.set_header('Accept-Ranges', 'bytes') start = 0 end = file_size - 1 if range_header: self.set_status(206) start_bytes, end_bytes = range_header.replace('bytes=', '').split('-') start = int(start_bytes) if start_bytes else 0 end = int(end_bytes) if end_bytes else file_size - 1 self.set_header('Content-Range', f'bytes {start}-{end}/{file_size}') self.set_header("Content-Length", str(end - start + 1)) self.set_header('Content-Type', mime_type) chunk_size = 4096 * 16 async with aiofiles.open(file_path, 'rb') as f: await f.seek(start) remaining = end - start + 1 while remaining > 0: chunk = await f.read(min(chunk_size, remaining)) if not chunk: break self.write(chunk) await self.flush() remaining -= len(chunk) self.finish() elif ext == '.txt': self.set_header('Content-Type', 'text/plain; charset=UTF-8') async with aiofiles.open(file_path, 'r', encoding='utf-8') as f: content = await f.read() self.write(content) self.finish() elif ext in ['.png', '.jpg', '.jpeg', '.gif', '.md', '.pdf', '.docx', '.xlsx', '.pptx']: self.set_header('Content-Type', mime_type) async with aiofiles.open(file_path, 'rb') as f: data = await f.read() self.write(data) self.finish() else: self.set_status(400) self.write("不支持预览此文件类型")
08-20
评论
成就一亿技术人!
拼手气红包6.0元
还能输入1000个字符
 
红包 添加红包
表情包 插入表情
 条评论被折叠 查看
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值