tornado.py 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412
  1. import asyncio
  2. import fnmatch
  3. import json
  4. import logging
  5. import os
  6. import threading
  7. import typing
  8. import webbrowser
  9. from functools import partial
  10. from urllib.parse import urlparse
  11. import tornado
  12. import tornado.httpserver
  13. import tornado.ioloop
  14. import tornado.web
  15. import tornado.websocket
  16. from . import page
  17. from .adaptor import ws as ws_adaptor
  18. from .page import make_applications, render_page
  19. from .remote_access import start_remote_access_service
  20. from .utils import cdn_validation, print_listen_address
  21. from ..session import ScriptModeSession, register_session_implement_for_target, Session
  22. from ..session.base import get_session_info_from_headers
  23. from ..utils import get_free_port, wait_host_port, STATIC_PATH, check_webio_js, parse_file_size
# Module-level logger used by the helpers in this file.
logger = logging.getLogger(__name__)
# IOLoop slot written by set_ioloop() and read by ioloop(); None until one is recorded.
_ioloop = None
  26. def set_ioloop(loop):
  27. global _ioloop
  28. _ioloop = loop
  29. def ioloop() -> tornado.ioloop.IOLoop:
  30. """获得运行Tornado server的IOLoop
  31. 本方法当前仅在显示boken app时使用
  32. This method is currently only used when displaying boken app"""
  33. global _ioloop
  34. return _ioloop
  35. def _check_origin(origin, allowed_origins, handler: tornado.websocket.WebSocketHandler):
  36. if _is_same_site(origin, handler):
  37. return True
  38. return any(
  39. fnmatch.fnmatch(origin, pattern)
  40. for pattern in allowed_origins
  41. )
  42. def _is_same_site(origin, handler: tornado.websocket.WebSocketHandler):
  43. parsed_origin = urlparse(origin)
  44. origin = parsed_origin.netloc
  45. origin = origin.lower()
  46. host = handler.request.headers.get("Host")
  47. # Check to see that origin matches host directly, including ports
  48. return origin == host
  49. class WebSocketConnection(ws_adaptor.WebSocketConnection):
  50. def __init__(self, context: tornado.websocket.WebSocketHandler):
  51. self.context = context
  52. def get_query_argument(self, name) -> typing.Optional[str]:
  53. return self.context.get_query_argument(name, None)
  54. def make_session_info(self) -> dict:
  55. session_info = get_session_info_from_headers(self.context.request.headers)
  56. session_info['user_ip'] = self.context.request.remote_ip
  57. session_info['request'] = self.context.request
  58. session_info['backend'] = 'tornado'
  59. session_info['protocol'] = 'websocket'
  60. return session_info
  61. def write_message(self, message: dict):
  62. self.context.write_message(json.dumps(message))
  63. def closed(self) -> bool:
  64. return not bool(self.context.ws_connection)
  65. def close(self):
  66. self.context.close()
  67. def _webio_handler(applications=None, cdn=True, reconnect_timeout=0, check_origin_func=_is_same_site): # noqa: C901
  68. """
  69. :param dict applications: dict of `name -> task function`
  70. :param bool/str cdn: Whether to load front-end static resources from CDN
  71. :param callable check_origin_func: check_origin_func(origin, handler) -> bool
  72. :return: Tornado RequestHandler class
  73. """
  74. check_webio_js()
  75. if applications is None:
  76. applications = dict(index=lambda: None) # mock PyWebIO app
  77. ws_adaptor.set_expire_second(reconnect_timeout)
  78. tornado.ioloop.IOLoop.current().spawn_callback(ws_adaptor.session_clean_task)
  79. class Handler(tornado.websocket.WebSocketHandler):
  80. def get_app(self):
  81. app_name = self.get_query_argument('app', 'index')
  82. app = applications.get(app_name) or applications['index']
  83. return app
  84. def get_cdn(self):
  85. if cdn is True and self.get_query_argument('_pywebio_cdn', '') == 'false':
  86. return False
  87. return cdn
  88. async def get(self, *args, **kwargs) -> None:
  89. """http GET request"""
  90. if self.request.headers.get("Upgrade", "").lower() != "websocket":
  91. # Backward compatible
  92. # Frontend detect whether the backend is http server
  93. if self.get_query_argument('test', ''):
  94. return self.write('')
  95. app = self.get_app()
  96. html = render_page(app, protocol='ws', cdn=self.get_cdn())
  97. return self.write(html)
  98. else:
  99. await super().get()
  100. def check_origin(self, origin):
  101. return check_origin_func(origin=origin, handler=self)
  102. def get_compression_options(self):
  103. # Non-None enables compression with default options.
  104. return {}
  105. _handler: ws_adaptor.WebSocketHandler
  106. def open(self):
  107. conn = WebSocketConnection(self)
  108. self._handler = ws_adaptor.WebSocketHandler(
  109. connection=conn, application=self.get_app(), reconnectable=bool(reconnect_timeout)
  110. )
  111. def on_message(self, message):
  112. self._handler.send_client_data(message)
  113. def on_close(self):
  114. self._handler.notify_connection_lost()
  115. return Handler
  116. def webio_handler(applications, cdn=True, reconnect_timeout=0, allowed_origins=None, check_origin=None):
  117. """Get the ``RequestHandler`` class for running PyWebIO applications in Tornado.
  118. The ``RequestHandler`` communicates with the browser by WebSocket protocol.
  119. The arguments of ``webio_handler()`` have the same meaning as for :func:`pywebio.platform.tornado.start_server`
  120. """
  121. applications = make_applications(applications)
  122. for target in applications.values():
  123. register_session_implement_for_target(target)
  124. cdn = cdn_validation(cdn, 'error') # if CDN is not available, raise error
  125. if check_origin is None:
  126. check_origin_func = partial(_check_origin, allowed_origins=allowed_origins or [])
  127. else:
  128. check_origin_func = lambda origin, handler: _is_same_site(origin, handler) or check_origin(origin)
  129. return _webio_handler(applications=applications, cdn=cdn, check_origin_func=check_origin_func,
  130. reconnect_timeout=reconnect_timeout)
  131. async def open_webbrowser_on_server_started(host, port):
  132. url = 'http://%s:%s' % (host, port)
  133. is_open = await wait_host_port(host, port, duration=20)
  134. if is_open:
  135. logger.info('Try open %s in web browser' % url)
  136. # webbrowser.open() may block, so invoke it in thread
  137. threading.Thread(target=webbrowser.open, args=(url,), daemon=True).start()
  138. else:
  139. logger.error('Open %s in web browser failed.' % url)
  140. def _setup_server(webio_handler, port=0, host='', static_dir=None, max_buffer_size=2 ** 20 * 200,
  141. **tornado_app_settings):
  142. if port == 0:
  143. port = get_free_port()
  144. handlers = [(r"/", webio_handler)]
  145. if static_dir is not None:
  146. handlers.append((r"/static/(.*)", tornado.web.StaticFileHandler, {"path": static_dir}))
  147. handlers.append((r"/(.*)", tornado.web.StaticFileHandler, {"path": STATIC_PATH, 'default_filename': 'index.html'}))
  148. app = tornado.web.Application(handlers=handlers, **tornado_app_settings)
  149. # Credit: https://stackoverflow.com/questions/19074972/content-length-too-long-when-uploading-file-using-tornado
  150. server = app.listen(port, address=host, max_buffer_size=max_buffer_size)
  151. return server, port
  152. def start_server(applications, port=0, host='',
  153. debug=False, cdn=True, static_dir=None,
  154. remote_access=False,
  155. reconnect_timeout=0,
  156. allowed_origins=None, check_origin=None,
  157. auto_open_webbrowser=False,
  158. max_payload_size='200M',
  159. **tornado_app_settings):
  160. """Start a Tornado server to provide the PyWebIO application as a web service.
  161. The Tornado server communicates with the browser by WebSocket protocol.
  162. Tornado is the default backend server for PyWebIO applications,
  163. and ``start_server`` can be imported directly using ``from pywebio import start_server``.
  164. :param list/dict/callable applications: PyWebIO application.
  165. Can be a task function, a list of functions, or a dictionary.
  166. Refer to :ref:`Advanced topic: Multiple applications in start_server() <multiple_app>` for more information.
  167. When the task function is a coroutine function, use :ref:`Coroutine-based session <coroutine_based_session>` implementation,
  168. otherwise, use thread-based session implementation.
  169. :param int port: The port the server listens on.
  170. When set to ``0``, the server will automatically select a available port.
  171. :param str host: The host the server listens on. ``host`` may be either an IP address or hostname.
  172. If it’s a hostname, the server will listen on all IP addresses associated with the name.
  173. ``host`` may be an empty string or None to listen on all available interfaces.
  174. :param bool debug: Tornado Server's debug mode. If enabled, the server will automatically reload for code changes.
  175. See `tornado doc <https://www.tornadoweb.org/en/stable/guide/running.html#debug-mode>`_ for more detail.
  176. :param bool/str cdn: Whether to load front-end static resources from CDN, the default is ``True``.
  177. Can also use a string to directly set the url of PyWebIO static resources.
  178. :param str static_dir: The directory to store the application static files.
  179. The files in this directory can be accessed via ``http://<host>:<port>/static/files``.
  180. For example, if there is a ``A/B.jpg`` file in ``static_dir`` path,
  181. it can be accessed via ``http://<host>:<port>/static/A/B.jpg``.
  182. :param bool remote_access: Whether to enable remote access, when enabled,
  183. you can get a temporary public network access address for the current application,
  184. others can access your application via this address.
  185. :param bool auto_open_webbrowser: Whether or not auto open web browser when server is started (if the operating system allows it) .
  186. :param int reconnect_timeout: The client can reconnect to server within ``reconnect_timeout`` seconds after an unexpected disconnection.
  187. If set to 0 (default), once the client disconnects, the server session will be closed.
  188. :param list allowed_origins: The allowed request source list. (The current server host is always allowed)
  189. The source contains the protocol, domain name, and port part.
  190. Can use Unix shell-style wildcards:
  191. - ``*`` matches everything
  192. - ``?`` matches any single character
  193. - ``[seq]`` matches any character in *seq*
  194. - ``[!seq]`` matches any character not in *seq*
  195. Such as: ``https://*.example.com`` 、 ``*://*.example.com``
  196. For detail, see `Python Doc <https://docs.python.org/zh-tw/3/library/fnmatch.html>`_
  197. :param callable check_origin: The validation function for request source.
  198. It receives the source string (which contains protocol, host, and port parts) as parameter and
  199. return ``True/False`` to indicate that the server accepts/rejects the request.
  200. If ``check_origin`` is set, the ``allowed_origins`` parameter will be ignored.
  201. :param bool auto_open_webbrowser: Whether or not auto open web browser when server is started (if the operating system allows it) .
  202. :param int/str max_payload_size: Max size of a websocket message which Tornado can accept.
  203. Messages larger than the ``max_payload_size`` (default 200MB) will not be accepted.
  204. ``max_payload_size`` can be a integer indicating the number of bytes, or a string ending with `K` / `M` / `G`
  205. (representing kilobytes, megabytes, and gigabytes, respectively).
  206. E.g: ``500``, ``'40K'``, ``'3M'``
  207. :param tornado_app_settings: Additional keyword arguments passed to the constructor of ``tornado.web.Application``.
  208. For details, please refer: https://www.tornadoweb.org/en/stable/web.html#tornado.web.Application.settings
  209. """
  210. set_ioloop(tornado.ioloop.IOLoop.current()) # to enable bokeh app
  211. cdn = cdn_validation(cdn, 'warn') # if CDN is not available, warn user and disable CDN
  212. page.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  213. debug = Session.debug = os.environ.get('PYWEBIO_DEBUG', debug)
  214. # Since some cloud server may close idle connections (such as heroku),
  215. # use `websocket_ping_interval` to keep the connection alive
  216. tornado_app_settings.setdefault('websocket_ping_interval', 30)
  217. tornado_app_settings.setdefault('websocket_max_message_size', max_payload_size) # Backward compatible
  218. tornado_app_settings['websocket_max_message_size'] = parse_file_size(
  219. tornado_app_settings['websocket_max_message_size'])
  220. tornado_app_settings['debug'] = debug
  221. handler = webio_handler(applications, cdn, allowed_origins=allowed_origins, check_origin=check_origin,
  222. reconnect_timeout=reconnect_timeout)
  223. _, port = _setup_server(webio_handler=handler, port=port, host=host, static_dir=static_dir,
  224. max_buffer_size=max_payload_size, **tornado_app_settings)
  225. print_listen_address(host, port)
  226. if auto_open_webbrowser:
  227. tornado.ioloop.IOLoop.current().spawn_callback(open_webbrowser_on_server_started, host or 'localhost', port)
  228. if remote_access:
  229. start_remote_access_service(local_port=port)
  230. tornado.ioloop.IOLoop.current().start()
  231. def start_server_in_current_thread_session():
  232. """启动 script mode 的server,监听可用端口,并自动打开浏览器
  233. Start the server for script mode, and automatically open the browser when the server port is available.
  234. PYWEBIO_SCRIPT_MODE_PORT环境变量可以设置监听端口,并关闭自动打开浏览器,用于测试
  235. The PYWEBIO_SCRIPT_MODE_PORT environment variable can set the listening port, just used in testing.
  236. """
  237. websocket_conn_opened = threading.Event()
  238. thread = threading.current_thread()
  239. class SingleSessionWSHandler(_webio_handler(cdn=False)):
  240. session = None
  241. instance = None
  242. closed = False
  243. def open(self):
  244. self.main_session = False
  245. cls = type(self)
  246. if SingleSessionWSHandler.session is None:
  247. self.main_session = True
  248. SingleSessionWSHandler.instance = self
  249. self.session_id = 'main'
  250. cls._connections[self.session_id] = self
  251. session_info = get_session_info_from_headers(self.request.headers)
  252. session_info['user_ip'] = self.request.remote_ip
  253. session_info['request'] = self.request
  254. session_info['backend'] = 'tornado'
  255. session_info['protocol'] = 'websocket'
  256. self.session = SingleSessionWSHandler.session = ScriptModeSession(
  257. thread, session_info=session_info,
  258. on_task_command=partial(self.send_msg_to_client, session_id=self.session_id),
  259. loop=asyncio.get_event_loop())
  260. websocket_conn_opened.set()
  261. cls._webio_sessions[self.session_id] = self.session
  262. else:
  263. self.close()
  264. def on_close(self):
  265. if SingleSessionWSHandler.session is not None and self.main_session:
  266. self.session.close()
  267. self.closed = True
  268. logger.debug('ScriptModeSession closed')
  269. async def wait_to_stop_loop(server):
  270. """当只剩当前线程和Daemon线程运行时,关闭Server
  271. When only the current thread and Daemon thread are running, close the Server"""
  272. # 包括当前线程在内的非Daemon线程数
  273. # The number of non-Daemon threads(including the current thread)
  274. alive_none_daemonic_thread_cnt = None
  275. while alive_none_daemonic_thread_cnt != 1:
  276. alive_none_daemonic_thread_cnt = sum(
  277. 1 for t in threading.enumerate() if t.is_alive() and not t.isDaemon()
  278. )
  279. await asyncio.sleep(0.5)
  280. if SingleSessionWSHandler.instance.session.need_keep_alive():
  281. while not SingleSessionWSHandler.instance.closed:
  282. await asyncio.sleep(0.5)
  283. # 关闭Websocket连接
  284. # Close the Websocket connection
  285. if SingleSessionWSHandler.instance:
  286. SingleSessionWSHandler.instance.close()
  287. server.stop()
  288. logger.debug('Closing tornado ioloop...')
  289. tasks = [t for t in asyncio.all_tasks() if t is not asyncio.current_task() and not t.done()]
  290. for task in tasks:
  291. task.cancel()
  292. # 必须需要 await asyncio.sleep ,否则上方 task.cancel() 调用无法调度生效
  293. # This line must be required, otherwise the `task.cancel()` call cannot be scheduled to take effect
  294. await asyncio.sleep(0)
  295. tornado.ioloop.IOLoop.current().stop()
  296. def server_thread():
  297. from tornado.log import access_log, app_log, gen_log
  298. access_log.setLevel(logging.ERROR)
  299. app_log.setLevel(logging.ERROR)
  300. gen_log.setLevel(logging.ERROR)
  301. loop = asyncio.new_event_loop()
  302. asyncio.set_event_loop(loop)
  303. set_ioloop(tornado.ioloop.IOLoop.current()) # to enable bokeh app
  304. port = 0
  305. if os.environ.get("PYWEBIO_SCRIPT_MODE_PORT"):
  306. port = int(os.environ.get("PYWEBIO_SCRIPT_MODE_PORT"))
  307. server, port = _setup_server(webio_handler=SingleSessionWSHandler, port=port, host='localhost',
  308. websocket_max_message_size=parse_file_size('200M'))
  309. tornado.ioloop.IOLoop.current().spawn_callback(partial(wait_to_stop_loop, server=server))
  310. if "PYWEBIO_SCRIPT_MODE_PORT" not in os.environ:
  311. tornado.ioloop.IOLoop.current().spawn_callback(open_webbrowser_on_server_started, 'localhost', port)
  312. tornado.ioloop.IOLoop.current().start()
  313. logger.debug('Tornado server exit')
  314. t = threading.Thread(target=server_thread, name='Tornado-server')
  315. t.start()
  316. websocket_conn_opened.wait()