path_deploy.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309
  1. import os.path
  2. from functools import partial
  3. from contextlib import contextmanager
  4. import tornado
  5. from tornado import template
  6. from tornado.web import HTTPError, Finish
  7. from tornado.web import StaticFileHandler
  8. from . import utils
  9. from .httpbased import HttpHandler
  10. from .tornado import webio_handler, set_ioloop
  11. from .tornado_http import TornadoHttpContext
  12. from .utils import cdn_validation, make_applications
  13. from ..session import register_session_implement, CoroutineBasedSession, ThreadBasedSession
  14. from ..utils import get_free_port, STATIC_PATH, parse_file_size
  15. def filename_ok(f):
  16. return not f.startswith(('.', '_'))
  17. def valid_and_norm_path(base, subpath):
  18. """Join the sub-path to base path. This function always ensure the result path is a subpath of base path.
  19. :param str base: MUST a absolute path
  20. :param str subpath: sub-path under the `base` path
  21. :return: normalized result path. None returned if the sub path is not valid
  22. """
  23. subpath = subpath.lstrip('/')
  24. full_path = os.path.normpath(os.path.join(base, subpath))
  25. if not full_path.startswith(base):
  26. return None
  27. parts = subpath.split('/')
  28. for i in parts:
  29. if not filename_ok(i):
  30. return None
  31. return full_path
  32. _cached_modules = {}
  33. def _get_module(path, reload=False):
  34. # https://docs.python.org/3/library/importlib.html#importing-a-source-file-directly
  35. # https://stackoverflow.com/questions/41861427/python-3-5-how-to-dynamically-import-a-module-given-the-full-file-path-in-the
  36. global _cached_modules
  37. import importlib.util
  38. @contextmanager
  39. def add_to_path(p):
  40. import sys
  41. sys.path.append(p)
  42. try:
  43. yield
  44. finally:
  45. sys.path.remove(p)
  46. if not reload and path in _cached_modules:
  47. return _cached_modules[path]
  48. # import_name will be the `__name__` of the imported module
  49. import_name = "__pywebio__"
  50. with add_to_path(os.path.dirname(path)):
  51. spec = importlib.util.spec_from_file_location(import_name, path, submodule_search_locations=None)
  52. module = importlib.util.module_from_spec(spec)
  53. spec.loader.exec_module(module)
  54. _cached_modules[path] = module
  55. return module
# Tornado template of the default directory index page. It is rendered with
# ``title`` (used as page title and heading) and ``files`` (one link per entry).
_app_list_tpl = template.Template("""
<!DOCTYPE html>
<html lang="">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<title>{{ title }}</title>
<meta name="description" content="PyWebIO applications index">
<style>a{text-decoration:none}</style>
</head>
<body>
<h1>{{ title }}</h1>
<hr>
<pre style="line-height: 1.6em; font-size: 16px;">
{% for f in files %} <a href="{{ f }}">{{ f }}</a>
{% end %}</pre>
<hr>
</body>
</html>
""".strip())
  76. def default_index_page(path, base):
  77. urlpath = path[len(base):] or '/'
  78. title = "Index of %s" % urlpath
  79. dirs = [] if path == base else ['../']
  80. files = []
  81. for f in os.listdir(path):
  82. if not filename_ok(f):
  83. continue
  84. if os.path.isfile(os.path.join(path, f)):
  85. if f.endswith('.py'):
  86. files.append(f[:-3])
  87. else:
  88. dirs.append(f + '/')
  89. return _app_list_tpl.generate(files=dirs + files, title=title)
  90. def get_app_from_path(request_path, base, index, reload=False):
  91. """Get PyWebIO app
  92. :param str request_path: request path
  93. :param str base: dir base path, MUST a absolute path
  94. :param callable index:
  95. :return: ('error', http error code in int) / ('app', pywebio task function) / ('html', Html content in bytes)
  96. """
  97. path = valid_and_norm_path(base, request_path)
  98. if path is None:
  99. return 'error', 403
  100. if os.path.isdir(path):
  101. if not request_path.endswith('/'):
  102. return 'error', 404
  103. if os.path.isfile(os.path.join(path, 'index.py')):
  104. path = os.path.join(path, 'index.py')
  105. elif index:
  106. content = index(path)
  107. return 'html', content
  108. else:
  109. return 'error', 404
  110. else:
  111. path += '.py'
  112. if not os.path.isfile(path):
  113. return 'error', 404
  114. module = _get_module(path, reload=reload)
  115. if hasattr(module, 'main'):
  116. return 'app', make_applications(module.main)
  117. return 'error', 404
  118. def _path_deploy(base, port=0, host='', static_dir=None, cdn=True, max_payload_size=2 ** 20 * 200,
  119. **tornado_app_settings):
  120. if not host:
  121. host = '0.0.0.0'
  122. if port == 0:
  123. port = get_free_port()
  124. tornado_app_settings = {k: v for k, v in tornado_app_settings.items() if v is not None}
  125. abs_base = os.path.normpath(os.path.abspath(base))
  126. cdn = cdn_validation(cdn, 'warn', stacklevel=4) # if CDN is not available, warn user and disable CDN
  127. cdn_url = '/_pywebio_static/' if not cdn else cdn
  128. register_session_implement(CoroutineBasedSession)
  129. register_session_implement(ThreadBasedSession)
  130. RequestHandler = yield cdn_url, abs_base
  131. handlers = []
  132. if static_dir is not None:
  133. handlers.append((r"/static/(.*)", StaticFileHandler, {"path": static_dir}))
  134. if not cdn:
  135. handlers.append((r"/_pywebio_static/(.*)", StaticFileHandler, {"path": STATIC_PATH}))
  136. handlers.append((r"/.*", RequestHandler))
  137. print('Listen on %s:%s' % (host or '0.0.0.0', port))
  138. set_ioloop(tornado.ioloop.IOLoop.current()) # to enable bokeh app
  139. app = tornado.web.Application(handlers=handlers, **tornado_app_settings)
  140. app.listen(port, address=host, max_buffer_size=max_payload_size)
  141. tornado.ioloop.IOLoop.current().start()
  142. def path_deploy(base, port=0, host='',
  143. index=True, static_dir=None,
  144. reconnect_timeout=0,
  145. cdn=True, debug=True,
  146. allowed_origins=None, check_origin=None,
  147. max_payload_size='200M',
  148. **tornado_app_settings):
  149. """Deploy the PyWebIO applications from a directory.
  150. The server communicates with the browser using WebSocket protocol.
  151. :param str base: Base directory to load PyWebIO application.
  152. :param int port: The port the server listens on.
  153. :param str host: The host the server listens on.
  154. :param bool/callable index: Whether to provide a default index page when request a directory, default is ``True``.
  155. ``index`` also accepts a function to custom index page, which receives the requested directory path as parameter
  156. and return HTML content in string.
  157. You can override the index page by add a `index.py` PyWebIO app file to the directory.
  158. :param str static_dir: Directory to store the application static files.
  159. The files in this directory can be accessed via ``http://<host>:<port>/static/files``.
  160. For example, if there is a ``A/B.jpg`` file in ``static_dir`` path,
  161. it can be accessed via ``http://<host>:<port>/static/A/B.jpg``.
  162. :param int reconnect_timeout: The client can reconnect to server within ``reconnect_timeout`` seconds after an unexpected disconnection.
  163. If set to 0 (default), once the client disconnects, the server session will be closed.
  164. The rest arguments of ``path_deploy()`` have the same meaning as for :func:`pywebio.platform.tornado.start_server`
  165. """
  166. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  167. # Since some cloud server may close idle connections (such as heroku),
  168. # use `websocket_ping_interval` to keep the connection alive
  169. tornado_app_settings.setdefault('websocket_ping_interval', 30)
  170. tornado_app_settings.setdefault('websocket_max_message_size', max_payload_size) # Backward compatible
  171. tornado_app_settings['websocket_max_message_size'] = parse_file_size(tornado_app_settings['websocket_max_message_size'])
  172. gen = _path_deploy(base, port=port, host=host,
  173. static_dir=static_dir,
  174. cdn=cdn, debug=debug,
  175. max_payload_size=max_payload_size,
  176. **tornado_app_settings)
  177. cdn_url, abs_base = next(gen)
  178. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  179. Handler = webio_handler(lambda: None, cdn_url, allowed_origins=allowed_origins,
  180. check_origin=check_origin, reconnect_timeout=reconnect_timeout)
  181. class WSHandler(Handler):
  182. def get_app(self):
  183. reload = self.get_query_argument('reload', None) is not None
  184. type, res = get_app_from_path(self.request.path, abs_base, index=index_func, reload=reload)
  185. if type == 'error':
  186. raise HTTPError(status_code=res)
  187. elif type == 'html':
  188. raise Finish(res)
  189. app_name = self.get_query_argument('app', 'index')
  190. app = res.get(app_name) or res['index']
  191. return app
  192. gen.send(WSHandler)
  193. gen.close()
  194. def path_deploy_http(base, port=0, host='',
  195. index=True, static_dir=None,
  196. cdn=True, debug=True,
  197. allowed_origins=None, check_origin=None,
  198. session_expire_seconds=None,
  199. session_cleanup_interval=None,
  200. max_payload_size='200M',
  201. **tornado_app_settings):
  202. """Deploy the PyWebIO applications from a directory.
  203. The server communicates with the browser using HTTP protocol.
  204. The ``base``, ``port``, ``host``, ``index``, ``static_dir`` arguments of ``path_deploy_http()``
  205. have the same meaning as for :func:`pywebio.platform.path_deploy`
  206. The rest arguments of ``path_deploy_http()`` have the same meaning as for :func:`pywebio.platform.tornado_http.start_server`
  207. """
  208. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  209. gen = _path_deploy(base, port=port, host=host,
  210. static_dir=static_dir,
  211. cdn=cdn, debug=debug,
  212. max_payload_size=max_payload_size,
  213. **tornado_app_settings)
  214. cdn_url, abs_base = next(gen)
  215. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  216. def get_app(context: TornadoHttpContext):
  217. reload = context.request_url_parameter('reload', None) is not None
  218. type, res = get_app_from_path(context.get_path(), abs_base, index=index_func, reload=reload)
  219. if type == 'error':
  220. raise HTTPError(status_code=res)
  221. elif type == 'html':
  222. raise Finish(res)
  223. app_name = context.request_url_parameter('app', 'index')
  224. return res.get(app_name) or res['index']
  225. handler = HttpHandler(app_loader=get_app, cdn=cdn_url,
  226. session_expire_seconds=session_expire_seconds,
  227. session_cleanup_interval=session_cleanup_interval,
  228. allowed_origins=allowed_origins,
  229. check_origin=check_origin)
  230. class ReqHandler(tornado.web.RequestHandler):
  231. def options(self):
  232. return self.get()
  233. def post(self):
  234. return self.get()
  235. def get(self):
  236. context = TornadoHttpContext(self)
  237. self.write(handler.handle_request(context))
  238. gen.send(ReqHandler)
  239. gen.close()