1
0

path_deploy.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344
  1. import os.path
  2. from functools import partial
  3. from contextlib import contextmanager
  4. import ast
  5. import tornado
  6. from tornado import template
  7. from tornado.web import HTTPError, Finish
  8. from tornado.web import StaticFileHandler
  9. from . import utils
  10. from .httpbased import HttpHandler
  11. from .tornado import webio_handler, set_ioloop
  12. from .tornado_http import TornadoHttpContext
  13. from .utils import cdn_validation, make_applications
  14. from ..session import register_session_implement, CoroutineBasedSession, ThreadBasedSession
  15. from ..utils import get_free_port, STATIC_PATH, parse_file_size
  16. def filename_ok(f):
  17. return not f.startswith(('.', '_'))
  18. def identifiers_info(code):
  19. """Get the identifiers and theirs docstring from python source code.
  20. :return dict:
  21. """
  22. try:
  23. tree = ast.parse(code)
  24. except Exception:
  25. return {}
  26. if not isinstance(tree, ast.Module):
  27. return {}
  28. identifier2doc = {}
  29. for node in tree.body:
  30. if isinstance(node, ast.Assign):
  31. for name in node.targets:
  32. identifier2doc[name.id] = ''
  33. elif isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef, ast.ClassDef)):
  34. doc_string = ast.get_docstring(node) or ''
  35. title = doc_string.split('\n\n')[0]
  36. identifier2doc[node.name] = title
  37. return identifier2doc
  38. def valid_and_norm_path(base, subpath):
  39. """Join the sub-path to base path. This function always ensure the result path is a subpath of base path.
  40. :param str base: MUST a absolute path
  41. :param str subpath: sub-path under the `base` path
  42. :return: normalized result path. None returned if the sub path is not valid
  43. """
  44. subpath = subpath.lstrip('/')
  45. full_path = os.path.normpath(os.path.join(base, subpath))
  46. if not full_path.startswith(base):
  47. return None
  48. parts = subpath.split('/')
  49. for i in parts:
  50. if not filename_ok(i):
  51. return None
  52. return full_path
  53. _cached_modules = {}
  54. def _get_module(path, reload=False):
  55. # https://docs.python.org/3/library/importlib.html#importing-a-source-file-directly
  56. # https://stackoverflow.com/questions/41861427/python-3-5-how-to-dynamically-import-a-module-given-the-full-file-path-in-the
  57. global _cached_modules
  58. import importlib.util
  59. @contextmanager
  60. def add_to_path(p):
  61. import sys
  62. sys.path.append(p)
  63. try:
  64. yield
  65. finally:
  66. sys.path.remove(p)
  67. if not reload and path in _cached_modules:
  68. return _cached_modules[path]
  69. # import_name will be the `__name__` of the imported module
  70. import_name = "__pywebio__"
  71. with add_to_path(os.path.dirname(path)):
  72. spec = importlib.util.spec_from_file_location(import_name, path, submodule_search_locations=None)
  73. module = importlib.util.module_from_spec(spec)
  74. spec.loader.exec_module(module)
  75. _cached_modules[path] = module
  76. return module
# Tornado template of the default directory index page.
# Rendered with three variables:
#   title          - page title / heading
#   files          - iterable of (name, doc) pairs, one link per entry
#   max_name_width - minimum link width in ``ch`` units, used to align the doc column
_app_list_tpl = template.Template("""
<!DOCTYPE html>
<html lang="">
<head>
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1, shrink-to-fit=no">
<title>{{ title }}</title>
<meta name="description" content="PyWebIO applications index">
<style>a{text-decoration:none;display:inline-block;min-width:{{ max_name_width }}ch}span{color:grey}</style>
</head>
<body>
<h1>{{ title }}</h1>
<hr>
<pre style="line-height: 1.6em; font-size: 16px;">
{% for name,doc in files %} <a href="{{ name }}">{{ name }}</a> <span>{{ doc }}</span>
{% end %}</pre>
<hr>
</body>
</html>
""".strip())
  97. def default_index_page(path, base):
  98. urlpath = path[len(base):] or '/'
  99. title = "Index of %s" % urlpath
  100. dirs = [] if path == base else [('../', '')] # (name, doc)
  101. files = [] # (name, doc)
  102. for f in os.listdir(path):
  103. if not filename_ok(f):
  104. continue
  105. full_path = os.path.join(path, f)
  106. if os.path.isfile(full_path):
  107. if f.endswith('.py'):
  108. code = open(full_path, encoding='utf8').read()
  109. identifiers = identifiers_info(code)
  110. if 'main' in identifiers:
  111. files.append([f[:-3], identifiers['main']])
  112. else:
  113. dirs.append([(f + '/'), ''])
  114. items = dirs + files
  115. max_name_width = max([len(n) for n, _ in items]+[0])
  116. return _app_list_tpl.generate(files=items, title=title, max_name_width=max_name_width)
  117. def get_app_from_path(request_path, base, index, reload=False):
  118. """Get PyWebIO app
  119. :param str request_path: request path
  120. :param str base: dir base path, MUST a absolute path
  121. :param callable index:
  122. :return: ('error', http error code in int) / ('app', pywebio task function) / ('html', Html content in bytes)
  123. """
  124. path = valid_and_norm_path(base, request_path)
  125. if path is None:
  126. return 'error', 403
  127. if os.path.isdir(path):
  128. if not request_path.endswith('/'):
  129. return 'error', 404
  130. if os.path.isfile(os.path.join(path, 'index.py')):
  131. path = os.path.join(path, 'index.py')
  132. elif index:
  133. content = index(path)
  134. return 'html', content
  135. else:
  136. return 'error', 404
  137. else:
  138. path += '.py'
  139. if not os.path.isfile(path):
  140. return 'error', 404
  141. module = _get_module(path, reload=reload)
  142. if hasattr(module, 'main'):
  143. return 'app', make_applications(module.main)
  144. return 'error', 404
  145. def _path_deploy(base, port=0, host='', static_dir=None, cdn=True, max_payload_size=2 ** 20 * 200,
  146. **tornado_app_settings):
  147. if not host:
  148. host = '0.0.0.0'
  149. if port == 0:
  150. port = get_free_port()
  151. tornado_app_settings = {k: v for k, v in tornado_app_settings.items() if v is not None}
  152. abs_base = os.path.normpath(os.path.abspath(base))
  153. cdn = cdn_validation(cdn, 'warn', stacklevel=4) # if CDN is not available, warn user and disable CDN
  154. cdn_url = '/_pywebio_static/' if not cdn else cdn
  155. register_session_implement(CoroutineBasedSession)
  156. register_session_implement(ThreadBasedSession)
  157. RequestHandler = yield cdn_url, abs_base
  158. handlers = []
  159. if static_dir is not None:
  160. handlers.append((r"/static/(.*)", StaticFileHandler, {"path": static_dir}))
  161. if not cdn:
  162. handlers.append((r"/_pywebio_static/(.*)", StaticFileHandler, {"path": STATIC_PATH}))
  163. handlers.append((r"/.*", RequestHandler))
  164. print('Listen on %s:%s' % (host or '0.0.0.0', port))
  165. set_ioloop(tornado.ioloop.IOLoop.current()) # to enable bokeh app
  166. app = tornado.web.Application(handlers=handlers, **tornado_app_settings)
  167. app.listen(port, address=host, max_buffer_size=max_payload_size)
  168. tornado.ioloop.IOLoop.current().start()
  169. def path_deploy(base, port=0, host='',
  170. index=True, static_dir=None,
  171. reconnect_timeout=0,
  172. cdn=True, debug=True,
  173. allowed_origins=None, check_origin=None,
  174. max_payload_size='200M',
  175. **tornado_app_settings):
  176. """Deploy the PyWebIO applications from a directory.
  177. The server communicates with the browser using WebSocket protocol.
  178. :param str base: Base directory to load PyWebIO application.
  179. :param int port: The port the server listens on.
  180. :param str host: The host the server listens on.
  181. :param bool/callable index: Whether to provide a default index page when request a directory, default is ``True``.
  182. ``index`` also accepts a function to custom index page, which receives the requested directory path as parameter
  183. and return HTML content in string.
  184. You can override the index page by add a `index.py` PyWebIO app file to the directory.
  185. :param str static_dir: Directory to store the application static files.
  186. The files in this directory can be accessed via ``http://<host>:<port>/static/files``.
  187. For example, if there is a ``A/B.jpg`` file in ``static_dir`` path,
  188. it can be accessed via ``http://<host>:<port>/static/A/B.jpg``.
  189. :param int reconnect_timeout: The client can reconnect to server within ``reconnect_timeout`` seconds after an unexpected disconnection.
  190. If set to 0 (default), once the client disconnects, the server session will be closed.
  191. The rest arguments of ``path_deploy()`` have the same meaning as for :func:`pywebio.platform.tornado.start_server`
  192. """
  193. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  194. # Since some cloud server may close idle connections (such as heroku),
  195. # use `websocket_ping_interval` to keep the connection alive
  196. tornado_app_settings.setdefault('websocket_ping_interval', 30)
  197. tornado_app_settings.setdefault('websocket_max_message_size', max_payload_size) # Backward compatible
  198. tornado_app_settings['websocket_max_message_size'] = parse_file_size(tornado_app_settings['websocket_max_message_size'])
  199. gen = _path_deploy(base, port=port, host=host,
  200. static_dir=static_dir,
  201. cdn=cdn, debug=debug,
  202. max_payload_size=max_payload_size,
  203. **tornado_app_settings)
  204. cdn_url, abs_base = next(gen)
  205. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  206. Handler = webio_handler(lambda: None, cdn_url, allowed_origins=allowed_origins,
  207. check_origin=check_origin, reconnect_timeout=reconnect_timeout)
  208. class WSHandler(Handler):
  209. def get_app(self):
  210. reload = self.get_query_argument('reload', None) is not None
  211. type, res = get_app_from_path(self.request.path, abs_base, index=index_func, reload=reload)
  212. if type == 'error':
  213. raise HTTPError(status_code=res)
  214. elif type == 'html':
  215. raise Finish(res)
  216. app_name = self.get_query_argument('app', 'index')
  217. app = res.get(app_name) or res['index']
  218. return app
  219. gen.send(WSHandler)
  220. gen.close()
  221. def path_deploy_http(base, port=0, host='',
  222. index=True, static_dir=None,
  223. cdn=True, debug=True,
  224. allowed_origins=None, check_origin=None,
  225. session_expire_seconds=None,
  226. session_cleanup_interval=None,
  227. max_payload_size='200M',
  228. **tornado_app_settings):
  229. """Deploy the PyWebIO applications from a directory.
  230. The server communicates with the browser using HTTP protocol.
  231. The ``base``, ``port``, ``host``, ``index``, ``static_dir`` arguments of ``path_deploy_http()``
  232. have the same meaning as for :func:`pywebio.platform.path_deploy`
  233. The rest arguments of ``path_deploy_http()`` have the same meaning as for :func:`pywebio.platform.tornado_http.start_server`
  234. """
  235. utils.MAX_PAYLOAD_SIZE = max_payload_size = parse_file_size(max_payload_size)
  236. gen = _path_deploy(base, port=port, host=host,
  237. static_dir=static_dir,
  238. cdn=cdn, debug=debug,
  239. max_payload_size=max_payload_size,
  240. **tornado_app_settings)
  241. cdn_url, abs_base = next(gen)
  242. index_func = {True: partial(default_index_page, base=abs_base), False: lambda p: '403 Forbidden'}.get(index, index)
  243. def get_app(context: TornadoHttpContext):
  244. reload = context.request_url_parameter('reload', None) is not None
  245. type, res = get_app_from_path(context.get_path(), abs_base, index=index_func, reload=reload)
  246. if type == 'error':
  247. raise HTTPError(status_code=res)
  248. elif type == 'html':
  249. raise Finish(res)
  250. app_name = context.request_url_parameter('app', 'index')
  251. return res.get(app_name) or res['index']
  252. handler = HttpHandler(app_loader=get_app, cdn=cdn_url,
  253. session_expire_seconds=session_expire_seconds,
  254. session_cleanup_interval=session_cleanup_interval,
  255. allowed_origins=allowed_origins,
  256. check_origin=check_origin)
  257. class ReqHandler(tornado.web.RequestHandler):
  258. def options(self):
  259. return self.get()
  260. def post(self):
  261. return self.get()
  262. def get(self):
  263. context = TornadoHttpContext(self)
  264. self.write(handler.handle_request(context))
  265. gen.send(ReqHandler)
  266. gen.close()