X-Git-Url: https://arthur.barton.de/cgi-bin/gitweb.cgi?a=blobdiff_plain;f=cmd%2Fweb-cmd.py;h=eeb9107d3e93e19e98c2c1bb61a7cf68d571d82b;hb=6b6559e405d264d4127211b935b21a3dda93ad93;hp=29523158ee0882065ceeb39322423781dabedb80;hpb=98805befbcccd27869d9f5f70132a3e847477d75;p=bup.git

diff --git a/cmd/web-cmd.py b/cmd/web-cmd.py
index 2952315..eeb9107 100755
--- a/cmd/web-cmd.py
+++ b/cmd/web-cmd.py
@@ -1,137 +1,195 @@
-#!/usr/bin/env python
-import sys, stat, cgi, shutil, urllib, mimetypes, posixpath
-import BaseHTTPServer
+#!/bin/sh
+"""": # -*-python-*-
+bup_python="$(dirname "$0")/bup-python" || exit $?
+exec "$bup_python" "$0" ${1+"$@"}
+"""
+# end of bup preamble
+
+from __future__ import absolute_import, print_function
+from collections import namedtuple
+import mimetypes, os, posixpath, signal, stat, sys, time, urllib, webbrowser
+
 from bup import options, git, vfs
-from bup.helpers import *
+from bup.helpers import (chunkyreader, debug1, format_filesize, handle_ctrl_c,
+                         log, saved_errors)
+from bup.metadata import Metadata
+from bup.path import resource_path
+from bup.repo import LocalRepo
+
 try:
-    from cStringIO import StringIO
+    from tornado import gen
+    from tornado.httpserver import HTTPServer
+    from tornado.ioloop import IOLoop
+    from tornado.netutil import bind_unix_socket
+    import tornado.web
 except ImportError:
-    from StringIO import StringIO
+    log('error: cannot find the python "tornado" module; please install it\n')
+    sys.exit(1)
+
+
+# FIXME: right now the way hidden files are handled causes every
+# directory to be traversed twice.
 
 handle_ctrl_c()
 
-class BupHTTPServer(BaseHTTPServer.HTTPServer):
-    def handle_error(self, request, client_address):
-        # If we get a KeyboardInterrupt error than just reraise it
-        # so that we cause the server to exit.
-        if sys.exc_info()[0] == KeyboardInterrupt:
-            raise
 
-class BupRequestHandler(BaseHTTPServer.BaseHTTPRequestHandler):
-    server_version = 'BupHTTP/%s' % version_tag()
-    protocol_version = 'HTTP/1.1'
-    def do_GET(self):
-        self._process_request()
+def http_date_from_utc_ns(utc_ns):  # utc_ns: nanoseconds since the epoch (UTC)
+    return time.strftime('%a, %d %b %Y %H:%M:%S GMT', time.gmtime(utc_ns / 10**9))
 
-    def do_HEAD(self):
-        self._process_request()
 
-    def _process_request(self):
-        """Common code for GET and HEAD commands.
+def _compute_breadcrumbs(path, show_hidden=False):
+    """Return a list of (label, url) breadcrumb tuples for path, root first."""
+    breadcrumbs = []
+    breadcrumbs.append(('[root]', '/'))
+    path_parts = path.split('/')[1:-1]  # drop leading '' and the last piece
+    full_path = '/'
+    for part in path_parts:
+        full_path += part + "/"
+        url_append = ""
+        if show_hidden:
+            url_append = '?hidden=1'  # carry the hidden-files flag in the link
+        breadcrumbs.append((part, full_path+url_append))
+    return breadcrumbs
 
-        This sends the response code and MIME headers along with the content
-        of the response.
-        """
-        path = urllib.unquote(self.path)
-        try:
-            n = top.resolve(path)
-        except vfs.NoSuchFile:
+
+def _contains_hidden_files(repo, dir_item):
+    """Return true if the directory contains items with names other than
+    '.' and '..' that begin with '.'
+
+    """
+    for name, item in vfs.contents(repo, dir_item, want_meta=False):
+        if name in ('.', '..'):
+            continue
+        if name.startswith('.'):
+            return True
+    return False
+
+
+def _dir_contents(repo, resolution, show_hidden=False):
+    """Yield the display information for the contents of dir_item."""
+
+    url_query = '?hidden=1' if show_hidden else ''
+
+    def display_info(name, item, resolved_item, display_name=None):
+        # link should be based on fully resolved type to avoid extra
+        # HTTP redirect.
+        if stat.S_ISDIR(vfs.item_mode(resolved_item)):
+            link = urllib.quote(name) + '/'
+        else:
+            link = urllib.quote(name)
+
+        size = vfs.item_size(repo, item)
+        if opt.human_readable:
+            display_size = format_filesize(size)
+        else:
+            display_size = size
+
+        if not display_name:
+            mode = vfs.item_mode(item)
+            if stat.S_ISDIR(mode):
+                display_name = name + '/'
+            elif stat.S_ISLNK(mode):
+                display_name = name + '@'
+            else:
+                display_name = name
+
+        return display_name, link + url_query, display_size
+
+    dir_item = resolution[-1][1]    
+    for name, item in vfs.contents(repo, dir_item):
+        if not show_hidden:
+            if (name not in ('.', '..')) and name.startswith('.'):
+                continue
+        if name == '.':
+            yield display_info(name, item, item, '.')
+            parent_item = resolution[-2][1] if len(resolution) > 1 else dir_item
+            yield display_info('..', parent_item, parent_item, '..')
+            continue
+        res = vfs.try_resolve(repo, name, parent=resolution, want_meta=False)
+        res_name, res_item = res[-1]
+        yield display_info(name, item, res_item)
+
+
+class BupRequestHandler(tornado.web.RequestHandler):
+
+    def initialize(self, repo=None):
+        self.repo = repo
+
+    def decode_argument(self, value, name=None):
+        if name == 'path':
+            return value
+        return super(BupRequestHandler, self).decode_argument(value, name)
+
+    def get(self, path):
+        return self._process_request(path)
+
+    def head(self, path):
+        return self._process_request(path)
+    
+    def _process_request(self, path):
+        path = urllib.unquote(path)
+        print('Handling request for %s' % path)
+        # Set want_meta because dir metadata won't be fetched, and if
+        # it's not a dir, then we're going to want the metadata.
+        res = vfs.resolve(self.repo, path, want_meta=True)
+        leaf_name, leaf_item = res[-1]
+        if not leaf_item:
             self.send_error(404)
             return
-        f = None
-        if stat.S_ISDIR(n.mode):
-            self._list_directory(path, n)
+        mode = vfs.item_mode(leaf_item)
+        if stat.S_ISDIR(mode):
+            self._list_directory(path, res)
         else:
-            self._get_file(path, n)
+            self._get_file(self.repo, path, res)
 
-    def _list_directory(self, path, n):
+    def _list_directory(self, path, resolution):
         """Helper to produce a directory listing.
 
         Return value is either a file object, or None (indicating an
         error).  In either case, the headers are sent.
         """
-        if not path.endswith('/'):
-            # redirect browser - doing basically what apache does
-            self.send_response(301)
-            self.send_header("Location", path + "/")
-            self.send_header("Content-Length", 0)
-            self.end_headers()
-            return
+        if not path.endswith('/') and len(path) > 0:
+            print('Redirecting from %s to %s' % (path, path + '/'))
+            return self.redirect(path + '/', permanent=True)
 
-        # Note that it is necessary to buffer the output into a StringIO here
-        # so that we can compute the content length before we send the
-        # content.  The only other option would be to do chunked encoding, or
-        # not support content length.
-        f = StringIO()
-        displaypath = cgi.escape(path)
-        f.write("""
-<HTML>
-  <HEAD>
-    <TITLE>Directory listing for %(displaypath)s</TITLE>
-    <STYLE>
-      BODY, TABLE { font-family: sans-serif }
-      .dir-name { text-align: left }
-      .dir-size { text-align: right }
-    </STYLE>
-  </HEAD>
-  <BODY>
-    <H2>Directory listing for %(displaypath)s</H2>
-    <TABLE>
-      <TR>
-        <TH class=dir-name>Name</TH>
-        <TH class=dir-size>Size<TH>
-      </TR>
-""" % { 'displaypath': displaypath })
-        for sub in n:
-            displayname = linkname = sub.name
-            # Append / for directories or @ for symbolic links
-            size = str(sub.size())
-            if stat.S_ISDIR(sub.mode):
-                displayname = sub.name + "/"
-                linkname = sub.name + "/"
-                size = '&nbsp;'
-            if stat.S_ISLNK(sub.mode):
-                displayname = sub.name + "@"
-                # Note: a link to a directory displays with @ and links with /
-                size = '&nbsp;'
-            f.write("""      <TR>
-        <TD class=dir-name><A href="%s">%s</A></TD>
-        <TD class=dir-size>%s</TD>
-      </TR>""" % (urllib.quote(linkname), cgi.escape(displayname), size))
-        f.write("""
-    </UL>
-  </BODY>
-</HTML>""")
-        length = f.tell()
-        f.seek(0)
-        self.send_response(200)
-        self.send_header("Content-type", "text/html")
-        self.send_header("Content-Length", str(length))
-        self.end_headers()
-        self._send_content(f)
-        f.close()
-
-    def _get_file(self, path, n):
+        hidden_arg = self.request.arguments.get('hidden', [0])[-1]
+        try:
+            show_hidden = int(hidden_arg)
+        except ValueError as e:
+            show_hidden = False
+
+        self.render(
+            'list-directory.html',
+            path=path,
+            breadcrumbs=_compute_breadcrumbs(path, show_hidden),
+            files_hidden=_contains_hidden_files(self.repo, resolution[-1][1]),
+            hidden_shown=show_hidden,
+            dir_contents=_dir_contents(self.repo, resolution,
+                                       show_hidden=show_hidden))
+
+    @gen.coroutine
+    def _get_file(self, repo, path, resolved):
         """Process a request on a file.
 
         Return value is either a file object, or None (indicating an error).
         In either case, the headers are sent.
         """
+        file_item = resolved[-1][1]
+        file_item = vfs.augment_item_meta(repo, file_item, include_size=True)
+        meta = file_item.meta
         ctype = self._guess_type(path)
-        f = n.open()
-        self.send_response(200)
-        self.send_header("Content-type", ctype)
-        self.send_header("Content-Length", str(n.size()))
-        self.send_header("Last-Modified", self.date_time_string(n.mtime))
-        self.end_headers()
-        self._send_content(f)
-        f.close()
-
-    def _send_content(self, f):
-        """Send the content file as the response if necessary."""
-        if self.command != 'HEAD':
-            for blob in chunkyreader(f):
-                self.wfile.write(blob)
+        self.set_header("Last-Modified", http_date_from_utc_ns(meta.mtime))
+        self.set_header("Content-Type", ctype)
+        
+        self.set_header("Content-Length", str(meta.size))
+        assert len(file_item.oid) == 20
+        self.set_header("Etag", file_item.oid.encode('hex'))
+        if self.request.method != 'HEAD':  # HEAD gets the headers only
+            with vfs.fopen(self.repo, file_item) as f:
+                it = chunkyreader(f)
+                for blob in it:
+                    self.write(blob)
+        raise gen.Return()
 
     def _guess_type(self, path):
         """Guess the type of a file.
@@ -166,31 +224,93 @@ class BupRequestHandler(BaseHTTPServer.BaseHTTPRequestHandler):
         })
 
 
+io_loop = None
+
+def handle_sigterm(signum, frame):
+    global io_loop
+    debug1('\nbup-web: signal %d received\n' % signum)
+    log('Shutdown requested\n')
+    if not io_loop:
+        sys.exit(0)
+    io_loop.stop()
+
+
+signal.signal(signal.SIGTERM, handle_sigterm)
+
+UnixAddress = namedtuple('UnixAddress', ['path'])
+InetAddress = namedtuple('InetAddress', ['host', 'port'])
+
 optspec = """
 bup web [[hostname]:port]
+bup web unix://path
 --
+human-readable    display human readable file sizes (i.e. 3.9K, 4.7M)
+browser           show repository in default browser (incompatible with unix://)
 """
-o = options.Options('bup web', optspec)
+o = options.Options(optspec)
 (opt, flags, extra) = o.parse(sys.argv[1:])
 
 if len(extra) > 1:
     o.fatal("at most one argument expected")
 
-address = ('127.0.0.1', 8080)
-if len(extra) > 0:
-    addressl = extra[0].split(':', 1)
-    addressl[1] = int(addressl[1])
-    address = tuple(addressl)
+if len(extra) == 0:
+    address = InetAddress(host='127.0.0.1', port=8080)
+else:
+    bind_url = extra[0]
+    if bind_url.startswith('unix://'):
+        address = UnixAddress(path=bind_url[len('unix://'):])
+    else:
+        addr_parts = bind_url.split(':', 1)
+        if len(addr_parts) == 1:  # no ':' given: treat the argument as a port
+            host = '127.0.0.1'
+            port = addr_parts[0]
+        else:
+            host, port = addr_parts
+        try:
+            port = int(port)
+        except (TypeError, ValueError):
+            o.fatal('port must be an integer, not %r' % port)
+        address = InetAddress(host=host, port=port)
 
 git.check_repo_or_die()
-top = vfs.RefList(None)
 
-try:
-    httpd = BupHTTPServer(address, BupRequestHandler)
-except socket.error, e:
-    log('socket%r: %s\n' % (address, e.args[1]))
+settings = dict(
+    debug = 1,
+    template_path = resource_path('web'),
+    static_path = resource_path('web/static')
+)
+
+# Disable buffering on stdout, for debug messages
+sys.stdout = os.fdopen(sys.stdout.fileno(), 'w', 0)
+
+application = tornado.web.Application([
+    (r"(?P<path>/.*)", BupRequestHandler, dict(repo=LocalRepo())),
+], **settings)
+
+http_server = HTTPServer(application)
+io_loop_pending = IOLoop.instance()
+
+if isinstance(address, InetAddress):
+    http_server.listen(address.port, address.host)
+    try:
+        sock = http_server._socket # tornado < 2.0
+    except AttributeError as e:
+        sock = http_server._sockets.values()[0]
+    print('Serving HTTP on %s:%d...' % sock.getsockname()[:2])  # IPv6: 4-tuple
+    if opt.browser:
+        browser_addr = 'http://' + address[0] + ':' + str(address[1])
+        io_loop_pending.add_callback(lambda : webbrowser.open(browser_addr))
+elif isinstance(address, UnixAddress):
+    unix_socket = bind_unix_socket(address.path)
+    http_server.add_socket(unix_socket)
+    print('Serving HTTP on filesystem socket %r' % address.path)
+else:
+    log('error: unexpected address %r\n' % (address,))
     sys.exit(1)
 
-sa = httpd.socket.getsockname()
-log("Serving HTTP on %s:%d...\n" % sa)
-httpd.serve_forever()
+io_loop = io_loop_pending
+io_loop.start()
+
+if saved_errors:
+    log('WARNING: %d errors encountered while saving.\n' % len(saved_errors))
+    sys.exit(1)