# path_deploy.py (12 KB)
  1. import os.path
  2. from functools import partial
  3. from contextlib import contextmanager
  4. import ast
  5. import tornado
  6. from tornado import template
  7. from tornado.web import HTTPError, Finish
  8. from tornado.web import StaticFileHandler
  9. from . import utils
  10. from .httpbased import HttpHandler
  11. from .tornado import webio_handler, set_ioloop
  12. from .tornado_http import TornadoHttpContext
  13. from .utils import cdn_validation, make_applications
  14. from ..session import register_session_implement, CoroutineBasedSession, ThreadBasedSession
  15. from ..utils import get_free_port, STATIC_PATH, parse_file_size
  16. def filename_ok(f):
  17. return not f.startswith(('.', '_'))
  18. def identifiers_info(code):
  19. """Get the identifiers and theirs docstring from python source code.
  20. :return dict:
  21. """
  22. try:
  23. tree = ast.parse(code)
  24. except Exception:
  25. return {}
  26. if not isinstance(tree, ast.Module):
  27. return {}
  28. identifier2doc = {}
  29. for node in tree.body:
  30. if isinstance(node, ast.Assign):
  31. for name in node.targets:
  32. if hasattr(name, 'id'):
  33. identifier2doc[name.id] = ''
  34. elif isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef, ast.ClassDef)):
  35. doc_string = ast.get_docstring(node) or ''
  36. title = doc_string.split('\n\n')[0]
  37. identifier2doc[node.name] = title
  38. return identifier2doc
  39. def valid_and_norm_path(base, subpath):
  40. """Join the sub-path to base path. This function always ensure the result path is a subpath of base path.
  41. :param str base: MUST a absolute path
  42. :param str subpath: sub-path under the `base` path
  43. :return: normalized result path. None returned if the sub path is not valid
  44. """
  45. subpath = subpath.lstrip('/')
  46. full_path = os.path.normpath(os.path.join(base, subpath))
  47. if not full_path.startswith(base):
  48. return None
  49. parts = subpath.split('/')
  50. for i in parts:
  51. if not filename_ok(i):
  52. return None
  53. return full_path
  54. _cached_modules = {}
  55. def _get_module(path, reload=False):
  56. # https://docs.python.org/3/library/importlib.html#importing-a-source-file-directly
  57. # https://stackoverflow.com/questions/41861427/python-3-5-how-to-dynamically-import-a-module-given-the-full-file-path-in-the
  58. global _cached_modules
  59. import importlib.util
  60. @contextmanager
  61. def add_to_path(p):
  62. import sys
  63. sys.path.append(p)
  64. try:
  65. yield
  66. finally:
  67. sys.path.remove(p)
  68. if not reload and path in _cached_modules:
  69. return _cached_modules[path]
  70. # import_name will be the `__name__` of the imported module
  71. import_name = "__pywebio__"
  72. with add_to_path(os.path.dirname(path)):
  73. spec = importlib.util.spec_from_file_location(import_name, path, submodule_search_locations=None)
  74. module = importlib.util.module_from_spec(spec)
  75. spec.loader.exec_module(module)
  76. _cached_modules[path] = module
  77. return module
# HTML template of the directory index page.
# Template variables: `title` (used for both <title> and <h1>), `files` (iterable of (name, doc)
# pairs, each rendered as a link followed by its description) and `max_name_width` (min-width of
# the links, in `ch` units). The entries live inside a <pre> element, so the line breaks and
# spaces around the `for` loop are part of the rendered layout.
_app_list_tpl = template.Template("""
<!DOCTYPE html>
<html lang="">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<title>{{ title }}</title>
<meta name="description" content="PyWebIO applications index">
<style>a{text-decoration:none;display:inline-block;min-width:{{ max_name_width }}ch}span{color:grey}</style>
</head>
<body>
<h1>{{ title }}</h1>
<hr>
<pre style="line-height: 1.6em; font-size: 16px;">
{% for name,doc in files %} <a href="{{ name }}">{{ name }}</a> <span>{{ doc }}</span>
{% end %}</pre>
<hr>
</body>
</html>
""".strip())
  98. def default_index_page(path, base):
  99. urlpath = path[len(base):] or '/'
  100. title = "Index of %s" % urlpath
  101. dirs = [] if path == base else [('../', '')] # (name, doc)
  102. files = [] # (name, doc)
  103. for f in os.listdir(path):
  104. if not filename_ok(f):
  105. continue
  106. full_path = os.path.join(path, f)
  107. if os.path.isfile(full_path):
  108. if f.endswith('.py'):
  109. code = open(full_path, encoding='utf8').read()
  110. identifiers = identifiers_info(code)
  111. if 'main' in identifiers:
  112. files.append([f[:-3], identifiers['main']])
  113. else:
  114. dirs.append([(f + '/'), ''])
  115. items = dirs + files
  116. max_name_width = max([len(n) for n, _ in items]+[0])
  117. return _app_list_tpl.generate(files=items, title=title, max_name_width=max_name_width)
  118. def get_app_from_path(request_path, base, index, reload=False):
  119. """Get PyWebIO app
  120. :param str request_path: request path
  121. :param str base: dir base path, MUST a absolute path
  122. :param callable index:
  123. :return: ('error', http error code in int) / ('app', pywebio task function) / ('html', Html content in bytes)
  124. """
  125. path = valid_and_norm_path(base, request_path)
  126. if path is None:
  127. return 'error', 403
  128. if os.path.isdir(path):
  129. if not request_path.endswith('/'):
  130. return 'error', 404
  131. if os.path.isfile(os.path.join(path, 'index.py')):
  132. path = os.path.join(path, 'index.py')
  133. elif index:
  134. content = index(path)
  135. return 'html', content
  136. else:
  137. return 'error', 404
  138. else:
  139. path += '.py'
  140. if not os.path.isfile(path):
  141. return 'error', 404
  142. module = _get_module(path, reload=reload)
  143. if hasattr(module, 'main'):
  144. return 'app', make_applications(module.main)
  145. return 'error', 404
  146. def _path_deploy(base, port=0, host='', static_dir=None, cdn=True, max_payload_size=2 ** 20 * 200,
  147. **tornado_app_settings):
  148. if not host:
  149. host = '0.0.0.0'
  150. if port == 0:
  151. port = get_free_port()
  152. tornado_app_settings = {k: v for k, v in tornado_app_settings.items() if v is not None}
  153. abs_base = os.path.normpath(os.path.abspath(base))
  154. cdn = cdn_validation(cdn, 'warn', stacklevel=4) # if CDN is not available, warn user and disable CDN
  155. cdn_url = '/_pywebio_static/' if not cdn else cdn
  156. register_session_implement(CoroutineBasedSession)
  157. register_session_implement(ThreadBasedSession)
  158. RequestHandler = yield cdn_url, abs_base
  159. handlers = []
  160. if static_dir is not None:
  161. handlers.append((r"/static/(.*)", StaticFileHandler, {"path": static_dir}))
  162. if not cdn:
  163. handlers.append((r"/_pywebio_static/(.*)", StaticFileHandler, {"path": STATIC_PATH}))
  164. handlers.append((r"/.*", RequestHandler))
  165. print('Listen on %s:%s' % (host or '0.0.0.0', port))
  166. set_ioloop(tornado.ioloop.IOLoop.current()) # to enable bokeh app
  167. app = tornado.web.Application(handlers=handlers, **tornado_app_settings)
  168. app.listen(port, address=host, max_buffer_size=max_payload_size)
  169. tornado.ioloop.IOLoop.current().start()
  170. def path_deploy(base, port=0, host='',
  171. index=True, static_dir=None,
  172. reconnect_timeout=0,
  173. cdn=True, debug=False,
  174. allowed_origins=None, check_origin=None,
  175. max_payload_size='200M',
  176. **tornado_app_settings):
  177. """Deploy the PyWebIO applications from a directory.
  178. The server communicates with the browser using WebSocket protocol.
  179. :param str base: Base directory to load PyWebIO application.
  180. :param int port: The port the server listens on.
  181. :param str host: The host the server listens on.
  182. :param bool/callable index: Whether to provide a default index page when request a directory, default is ``True``.
  183. ``index`` also accepts a function to custom index page, which receives the requested directory path as parameter
  184. and return HTML content in string.
  185. You can override the index page by add a `index.py` PyWebIO app file to the directory.
  186. :param str static_dir: Directory to store the application static files.
  187. The files in this directory can be accessed via ``http://<host>:<port>/static/files``.
  188. For example, if there is a ``A/B.jpg`` file in ``static_dir`` path,
  189. it can be accessed via ``http://<host>:<port>/static/A/B.jpg``.
  190. :param int reconnect_timeout: The client can reconnect to server within ``reconnect_timeout`` seconds after an unexpected disconnection.
  191. If set to 0 (default), once the client disconnects, the server session will be closed.
  192. The rest arguments of ``path_deploy()`` have the same meaning as for :func:`pywebio.platform.tornado.start_server`
  193. """
  194. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  195. # Since some cloud server may close idle connections (such as heroku),
  196. # use `websocket_ping_interval` to keep the connection alive
  197. tornado_app_settings.setdefault('websocket_ping_interval', 30)
  198. tornado_app_settings.setdefault('websocket_max_message_size', max_payload_size) # Backward compatible
  199. tornado_app_settings['websocket_max_message_size'] = parse_file_size(tornado_app_settings['websocket_max_message_size'])
  200. gen = _path_deploy(base, port=port, host=host,
  201. static_dir=static_dir,
  202. cdn=cdn, debug=debug,
  203. max_payload_size=max_payload_size,
  204. **tornado_app_settings)
  205. cdn_url, abs_base = next(gen)
  206. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  207. Handler = webio_handler(lambda: None, cdn_url, allowed_origins=allowed_origins,
  208. check_origin=check_origin, reconnect_timeout=reconnect_timeout)
  209. class WSHandler(Handler):
  210. def get_app(self):
  211. reload = self.get_query_argument('reload', None) is not None
  212. type, res = get_app_from_path(self.request.path, abs_base, index=index_func, reload=reload)
  213. if type == 'error':
  214. raise HTTPError(status_code=res)
  215. elif type == 'html':
  216. raise Finish(res)
  217. app_name = self.get_query_argument('app', 'index')
  218. app = res.get(app_name) or res['index']
  219. return app
  220. gen.send(WSHandler)
  221. gen.close()
  222. def path_deploy_http(base, port=0, host='',
  223. index=True, static_dir=None,
  224. cdn=True, debug=False,
  225. allowed_origins=None, check_origin=None,
  226. session_expire_seconds=None,
  227. session_cleanup_interval=None,
  228. max_payload_size='200M',
  229. **tornado_app_settings):
  230. """Deploy the PyWebIO applications from a directory.
  231. The server communicates with the browser using HTTP protocol.
  232. The ``base``, ``port``, ``host``, ``index``, ``static_dir`` arguments of ``path_deploy_http()``
  233. have the same meaning as for :func:`pywebio.platform.path_deploy`
  234. The rest arguments of ``path_deploy_http()`` have the same meaning as for :func:`pywebio.platform.tornado_http.start_server`
  235. """
  236. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  237. gen = _path_deploy(base, port=port, host=host,
  238. static_dir=static_dir,
  239. cdn=cdn, debug=debug,
  240. max_payload_size=max_payload_size,
  241. **tornado_app_settings)
  242. cdn_url, abs_base = next(gen)
  243. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  244. def get_app(context: TornadoHttpContext):
  245. reload = context.request_url_parameter('reload', None) is not None
  246. type, res = get_app_from_path(context.get_path(), abs_base, index=index_func, reload=reload)
  247. if type == 'error':
  248. raise HTTPError(status_code=res)
  249. elif type == 'html':
  250. raise Finish(res)
  251. app_name = context.request_url_parameter('app', 'index')
  252. return res.get(app_name) or res['index']
  253. handler = HttpHandler(app_loader=get_app, cdn=cdn_url,
  254. session_expire_seconds=session_expire_seconds,
  255. session_cleanup_interval=session_cleanup_interval,
  256. allowed_origins=allowed_origins,
  257. check_origin=check_origin)
  258. class ReqHandler(tornado.web.RequestHandler):
  259. def options(self):
  260. return self.get()
  261. def post(self):
  262. return self.get()
  263. def get(self):
  264. context = TornadoHttpContext(self)
  265. self.write(handler.handle_request(context))
  266. gen.send(ReqHandler)
  267. gen.close()