datasette/app.py
2017-10-23 19:25:48 -07:00

188 lines
5.1 KiB
Python

from sanic import Sanic
from sanic import response
from sanic.exceptions import NotFound
from sanic.views import HTTPMethodView
from sanic_jinja2 import SanicJinja2
import sqlite3
from pathlib import Path
from functools import wraps
import json
import hashlib
# Directory containing this module; ensure_build_metadata() globs it for
# database files and stores the metadata cache in it.
app_root = Path(__file__).parent
# File name of the JSON metadata cache written under app_root.
BUILD_METADATA = 'build-metadata.json'
# Glob patterns used to discover database files in app_root.
DB_GLOBS = ('*.db', '*.sqlite', '*.sqlite3')
# Number of bytes read per chunk when hashing a database file (1 MiB).
HASH_BLOCK_SIZE = 1024 * 1024
# Cache of open sqlite3 connections, keyed by database name (see get_conn).
conns = {}
# The Sanic application and the Jinja2 renderer bound to it.
app = Sanic(__name__)
jinja = SanicJinja2(app)
def get_conn(name):
    """Return the cached immutable sqlite3 connection for database ``name``.

    The connection is opened on first use, stored in the module-level
    ``conns`` dict and reused afterwards. Rows are returned as
    ``sqlite3.Row`` objects.

    Args:
        name: Database name, i.e. a key of the build metadata.

    Returns:
        sqlite3.Connection: Connection opened with ``immutable=1``.

    Raises:
        KeyError: If ``name`` is not present in the build metadata.
    """
    try:
        return conns[name]
    except KeyError:
        pass
    info = ensure_build_metadata()[name]
    # The metadata stores only the bare file name, so anchor it to app_root;
    # otherwise the database is looked up relative to the current working
    # directory. as_uri() also percent-encodes characters such as '?' or '#'
    # that would corrupt a hand-built URI.
    db_path = (app_root / info['file']).resolve()
    conn = sqlite3.connect(
        '{}?immutable=1'.format(db_path.as_uri()),
        uri=True,
    )
    conn.row_factory = sqlite3.Row
    conns[name] = conn
    return conn
def ensure_build_metadata(regenerate=False):
    """Return metadata for every database file found in ``app_root``.

    The result maps each database name (the file's stem) to a dict with the
    keys ``hash`` (SHA-256 hex digest of the file contents), ``file`` (the
    file name) and ``tables`` (table name -> row count). The mapping is
    cached as JSON in ``app_root / BUILD_METADATA``.

    Args:
        regenerate: When true, ignore an existing cache file and rebuild it.

    Returns:
        dict: The metadata mapping described above.

    Raises:
        Exception: If two database files share the same stem.
    """
    build_metadata = app_root / BUILD_METADATA
    if build_metadata.exists() and not regenerate:
        # Return the cached copy; previously the parsed JSON was discarded
        # and every call fell through to a full re-hash of all databases.
        return json.loads(build_metadata.read_text())
    metadata = {}
    for glob in DB_GLOBS:
        for path in app_root.glob(glob):
            name = path.stem
            if name in metadata:
                raise Exception('Multiple files with same stem %s' % name)
            metadata[name] = {
                'hash': _hash_file(path),
                'file': path.name,
                'tables': _count_table_rows(path),
            }
    build_metadata.write_text(json.dumps(metadata, indent=4))
    return metadata


def _hash_file(path):
    """Return the SHA-256 hex digest of ``path``, read in fixed-size chunks."""
    digest = hashlib.sha256()
    with path.open('rb') as fp:
        for chunk in iter(lambda: fp.read(HASH_BLOCK_SIZE), b''):
            digest.update(chunk)
    return digest.hexdigest()


def _count_table_rows(path):
    """Return ``{table name: row count}`` for the SQLite database at ``path``."""
    # Connect via the full path (not just the file name) so the lookup does
    # not depend on the current working directory.
    conn = sqlite3.connect(
        '{}?immutable=1'.format(path.resolve().as_uri()),
        uri=True,
    )
    # sqlite3's ``with conn:`` only manages transactions and leaves the
    # connection open, so close it explicitly.
    try:
        table_names = [
            row[0]
            for row in conn.execute(
                "select name from sqlite_master where type = 'table'"
            )
        ]
        return {
            # Double any embedded quote so unusual table names stay valid
            # quoted identifiers.
            table: conn.execute(
                'select count(*) from "{}"'.format(table.replace('"', '""'))
            ).fetchone()[0]
            for table in table_names
        }
    finally:
        conn.close()
class BaseView(HTTPMethodView):
    """Common GET handling for views that operate on a single database.

    Subclasses set ``template`` and provide a
    ``data(request, name, hash, **kwargs)`` method returning a dict, which
    is either rendered with the template or returned as JSON.
    """

    template = None

    async def get(self, request, db_name, **kwargs):
        """Resolve ``db_name``, redirect if required, else render or emit JSON."""
        database, db_hash, redirect_to = resolve_db_name(db_name)
        if redirect_to:
            return response.redirect(redirect_to)
        # ``as_json`` is a route capture; it is absent or falsy for HTML.
        as_json = kwargs.pop('as_json', False)
        context = self.data(request, database, db_hash, **kwargs)
        if not as_json:
            return jinja.render(self.template, request, **context)
        return response.json(context)
def sqlerrors(fn):
    """Wrap an async handler so ``sqlite3.OperationalError`` becomes JSON.

    On that error the wrapper returns a JSON response of the form
    ``{'ok': False, 'error': <message>}``; any other exception propagates
    and successful results are passed through unchanged.
    """
    @wraps(fn)
    async def guarded(*args, **kwargs):
        try:
            result = await fn(*args, **kwargs)
        except sqlite3.OperationalError as exc:
            payload = {
                'ok': False,
                'error': str(exc),
            }
            return response.json(payload)
        return result
    return guarded
@app.route('/')
@sqlerrors
async def index(request, sql=None):
    """Render ``index.html`` with freshly regenerated database metadata."""
    return jinja.render(
        'index.html',
        request,
        databases=ensure_build_metadata(regenerate=True),
    )
@app.route('/favicon.ico')
async def favicon(request):
    """Answer favicon requests with an empty text response."""
    empty_body = ''
    return response.text(empty_body)
class DatabaseView(BaseView):
    """View exposing the contents of ``sqlite_master`` for one database."""

    template = 'database.html'

    def data(self, request, name, hash):
        """Return the template/JSON context for database ``name``.

        ``rows`` is the live cursor for ``select * from sqlite_master`` (it
        is not materialised) and ``columns`` lists its column names.
        """
        cursor = get_conn(name).execute('select * from sqlite_master')
        return {
            'database': name,
            'database_hash': hash,
            'rows': cursor,
            'columns': [col[0] for col in cursor.description],
        }
class TableView(BaseView):
    """View showing the first 20 rows of a single table."""

    template = 'table.html'

    def data(self, request, name, hash, table):
        """Return the template/JSON context for ``table`` in database ``name``.

        Args:
            request: The incoming request (unused here).
            name: Resolved database name.
            hash: Short content hash of the database.
            table: Table name captured from the URL path.

        Returns:
            dict: ``database``, ``database_hash``, ``table``, ``rows`` (the
            live cursor over at most 20 rows) and ``columns`` (column names).
        """
        conn = get_conn(name)
        # ``table`` comes straight from the URL, so quote it as an identifier
        # (doubling embedded quotes) instead of splicing it in verbatim. This
        # blocks SQL injection and makes names with spaces or reserved words
        # work.
        quoted_table = '"{}"'.format(table.replace('"', '""'))
        rows = conn.execute('select * from {} limit 20'.format(quoted_table))
        columns = [r[0] for r in rows.description]
        return {
            'database': name,
            'database_hash': hash,
            'table': table,
            'rows': rows,
            'columns': columns,
        }
# URL routes. The optional trailing ".json" is captured as ``as_json``. The
# dot is escaped so that only a literal ".json" suffix selects JSON output;
# unescaped, it matched any character (e.g. "/fooxjson").
app.add_route(DatabaseView.as_view(), r'/<db_name:[^/]+?><as_json:(\.json)?$>')
app.add_route(TableView.as_view(), r'/<db_name:[^/]+>/<table:[^/]+?><as_json:(\.json)?$>')
def resolve_db_name(db_name):
    """Split a URL component into database name and hash and validate it.

    ``db_name`` is either a bare database name or ``<name>-<hash>``, where
    the hash is the first 7 characters of the database's SHA-256 digest.

    Args:
        db_name: The database component captured from the URL.

    Returns:
        tuple: ``(name, expected_hash, redirect_path)``. ``redirect_path``
        is ``'/<name>-<expected_hash>'`` when the URL carried no hash or a
        different one, otherwise ``None``.

    Raises:
        NotFound: If no database with the resolved name exists.
    """
    databases = ensure_build_metadata()
    name = db_name
    url_hash = None
    if '-' in db_name:
        # Might be name-and-hash, or might just be a name with a hyphen in it.
        prefix, suffix = db_name.rsplit('-', 1)
        # Treat the suffix as a hash only if the prefix is a known database
        # and the whole string is not itself a database name (unless the
        # suffix really is the prefix's hash). Otherwise a database called
        # "a-b" would be shadowed by a database called "a".
        if prefix in databases and (
            db_name not in databases
            or databases[prefix]['hash'][:7] == suffix
        ):
            name, url_hash = prefix, suffix
    try:
        info = databases[name]
    except KeyError:
        # Sanic's exception constructor takes a message; a bare NotFound()
        # raised TypeError and produced a 500 instead of a 404.
        raise NotFound('Database not found: {}'.format(name))
    expected = info['hash'][:7]
    if expected != url_hash:
        return name, expected, '/{}-{}'.format(name, expected)
    return name, expected, None
if __name__ == '__main__':
    # Listen on all interfaces, port 8006, when executed as a script.
    app.run(port=8006, host="0.0.0.0")