2014-05-31 04:01:21 +08:00
|
|
|
"""A contents manager that uses the local file system for storage."""
|
2011-08-18 04:21:19 +08:00
|
|
|
|
2014-04-28 06:54:31 +08:00
|
|
|
# Copyright (c) IPython Development Team.
|
|
|
|
# Distributed under the terms of the Modified BSD License.
|
2011-08-05 04:55:04 +08:00
|
|
|
|
2014-06-03 04:47:11 +08:00
|
|
|
import base64
|
2014-11-12 09:18:55 +08:00
|
|
|
import errno
|
2012-01-31 05:43:48 +08:00
|
|
|
import io
|
2011-08-05 04:55:04 +08:00
|
|
|
import os
|
2013-04-10 04:49:10 +08:00
|
|
|
import shutil
|
2014-11-12 09:18:55 +08:00
|
|
|
from contextlib import contextmanager
|
2014-11-06 08:11:29 +08:00
|
|
|
import mimetypes
|
2013-07-04 01:35:30 +08:00
|
|
|
|
2011-08-05 04:55:04 +08:00
|
|
|
from tornado import web
|
|
|
|
|
2014-05-31 04:01:21 +08:00
|
|
|
from .manager import ContentsManager
|
2014-10-24 06:35:01 +08:00
|
|
|
from IPython import nbformat
|
2014-08-05 02:22:42 +08:00
|
|
|
from IPython.utils.io import atomic_writing
|
2014-04-28 06:54:31 +08:00
|
|
|
from IPython.utils.path import ensure_dir_exists
|
2014-03-01 03:38:28 +08:00
|
|
|
from IPython.utils.traitlets import Unicode, Bool, TraitError
|
2014-11-12 09:18:55 +08:00
|
|
|
from IPython.utils.py3compat import getcwd, str_to_unicode
|
2013-07-04 03:16:22 +08:00
|
|
|
from IPython.utils import tz
|
2014-11-12 09:18:55 +08:00
|
|
|
from IPython.html.utils import is_hidden, to_os_path, to_api_path
|
2011-08-05 04:55:04 +08:00
|
|
|
|
|
|
|
|
2014-05-31 04:01:21 +08:00
|
|
|
class FileContentsManager(ContentsManager):
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-11-18 04:01:20 +08:00
|
|
|
# Configurable trait: the directory that API paths are resolved against
# (_get_os_path passes it to to_os_path).
root_dir = Unicode(config=True)
|
|
|
|
|
|
|
|
def _root_dir_default(self):
|
2014-11-18 05:39:58 +08:00
|
|
|
try:
|
|
|
|
return self.parent.notebook_dir
|
|
|
|
except AttributeError:
|
|
|
|
return getcwd()
|
2014-11-12 09:18:55 +08:00
|
|
|
|
|
|
|
@contextmanager
def perm_to_403(self, os_path=''):
    """context manager for turning permission errors into 403

    Parameters
    ----------
    os_path : string, optional
        OS path to report in the error message. When empty, the
        ``filename`` attribute of the caught exception is used instead
        (or 'unknown file' if that is empty too).

    Raises
    ------
    web.HTTPError
        403, when the wrapped code raises an OSError/IOError whose errno is
        EPERM or EACCES. Any other exception propagates unchanged.
    """
    try:
        yield
    # IOError is listed explicitly: on Python 2 it is not an OSError
    # subclass, and io.open reports permission problems with it.
    # On Python 3 the two names are the same class.
    except (OSError, IOError) as e:
        if e.errno not in {errno.EPERM, errno.EACCES}:
            raise
        # make 403 error message without root prefix
        # this may not work perfectly on unicode paths on Python 2,
        # but nobody should be doing that anyway.
        if not os_path:
            os_path = str_to_unicode(e.filename or 'unknown file')
        path = to_api_path(os_path, self.root_dir)
        raise web.HTTPError(403, u'Permission denied: %s' % path)
|
|
|
|
|
|
|
|
@contextmanager
def open(self, os_path, *args, **kwargs):
    """Open ``os_path`` with io.open inside ``self.perm_to_403``.

    Extra positional and keyword arguments are forwarded to io.open.
    Yields the opened file object; it is closed when the block exits.
    """
    with self.perm_to_403(os_path), \
            io.open(os_path, *args, **kwargs) as handle:
        yield handle
|
|
|
|
|
|
|
|
@contextmanager
def atomic_writing(self, os_path, *args, **kwargs):
    """Run the imported ``atomic_writing`` helper inside ``self.perm_to_403``.

    Extra positional and keyword arguments are forwarded to the helper.
    Yields whatever object the helper yields for writing.
    """
    with self.perm_to_403(os_path), \
            atomic_writing(os_path, *args, **kwargs) as handle:
        yield handle
|
|
|
|
|
2014-07-30 05:01:27 +08:00
|
|
|
# Deprecated configurable flag; per its own help text the value is ignored.
save_script = Bool(False, config=True, help='DEPRECATED, IGNORED')
|
|
|
|
def _save_script_changed(self):
|
|
|
|
self.log.warn("""
|
|
|
|
Automatically saving notebooks as scripts has been removed.
|
|
|
|
Use `ipython nbconvert --to python [notebook]` instead.
|
|
|
|
""")
|
|
|
|
|
2014-05-31 04:01:21 +08:00
|
|
|
def _root_dir_changed(self, name, old, new):
|
|
|
|
"""Do a bit of validation of the root_dir."""
|
2014-02-13 15:03:43 +08:00
|
|
|
if not os.path.isabs(new):
|
|
|
|
# If we receive a non-absolute path, make it absolute.
|
2014-05-31 04:01:21 +08:00
|
|
|
self.root_dir = os.path.abspath(new)
|
2014-02-13 15:03:43 +08:00
|
|
|
return
|
2014-07-30 05:01:27 +08:00
|
|
|
if not os.path.isdir(new):
|
2014-05-31 04:01:21 +08:00
|
|
|
raise TraitError("%r is not a directory" % new)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-04-24 02:44:29 +08:00
|
|
|
# Configurable trait: name of the per-directory folder that holds checkpoint
# files; get_checkpoint_path joins it onto the directory of the target file.
checkpoint_dir = Unicode('.ipynb_checkpoints', config=True,
    help="""The directory name in which to keep file checkpoints

    This is a path relative to the file's own directory.

    By default, it is .ipynb_checkpoints
    """
)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-03-15 01:05:30 +08:00
|
|
|
def _copy(self, src, dest):
|
|
|
|
"""copy src to dest
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-03-20 03:21:55 +08:00
|
|
|
like shutil.copy2, but log errors in copystat
|
2014-03-15 01:05:30 +08:00
|
|
|
"""
|
2014-03-20 03:21:55 +08:00
|
|
|
shutil.copyfile(src, dest)
|
|
|
|
try:
|
|
|
|
shutil.copystat(src, dest)
|
|
|
|
except OSError as e:
|
|
|
|
self.log.debug("copystat on %s failed", dest, exc_info=True)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-11-11 05:46:51 +08:00
|
|
|
def _get_os_path(self, path):
    """Translate an API path into a file system path.

    Parameters
    ----------
    path : string
        The relative API path to the named file.

    Returns
    -------
    path : string
        The result of ``to_os_path`` for ``path`` under ``self.root_dir``.
    """
    root = self.root_dir
    return to_os_path(path, root)
|
2013-07-13 00:15:08 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def dir_exists(self, path):
    """Report whether an API path names an existing directory.

    API-style wrapper for os.path.isdir

    Parameters
    ----------
    path : string
        The path to check. This is an API path (`/` separated,
        relative to root_dir).

    Returns
    -------
    exists : bool
        Whether the resolved OS path is a directory.
    """
    api_path = path.strip('/')
    return os.path.isdir(self._get_os_path(path=api_path))
|
2014-02-06 05:09:55 +08:00
|
|
|
|
|
|
|
def is_hidden(self, path):
    """Report whether an API path is considered hidden.

    Parameters
    ----------
    path : string
        The path to check. This is an API path (`/` separated,
        relative to root_dir).

    Returns
    -------
    hidden : bool
        The result of the imported ``is_hidden`` utility for the resolved
        OS path, evaluated relative to ``self.root_dir``.
    """
    api_path = path.strip('/')
    return is_hidden(self._get_os_path(path=api_path), self.root_dir)
|
2014-02-06 05:09:55 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def file_exists(self, path):
    """Report whether an API path names an existing regular file.

    API-style wrapper for os.path.isfile

    Parameters
    ----------
    path : string
        The relative path to the file (with '/' as separator)

    Returns
    -------
    exists : bool
        Whether the resolved OS path is a file.
    """
    api_path = path.strip('/')
    return os.path.isfile(self._get_os_path(api_path))
|
2013-10-08 03:38:34 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def exists(self, path):
    """Report whether an API path names anything that exists on disk.

    API-style wrapper for os.path.exists

    Parameters
    ----------
    path : string
        The API path to the file (with '/' as separator)

    Returns
    -------
    exists : bool
        Whether the resolved OS path exists.
    """
    api_path = path.strip('/')
    return os.path.exists(self._get_os_path(path=api_path))
|
2013-07-04 01:35:30 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _base_model(self, path):
    """Build the fields shared by every contents model.

    Stats the OS path behind ``path`` and returns a dict with the keys
    name, path, last_modified, created, content, format, mimetype and
    writable. content, format and mimetype start out as None.
    """
    os_path = self._get_os_path(path)
    stat_result = os.stat(os_path)
    modified_at = tz.utcfromtimestamp(stat_result.st_mtime)
    created_at = tz.utcfromtimestamp(stat_result.st_ctime)

    # Create the base model.
    model = {
        'name': path.rsplit('/', 1)[-1],
        'path': path,
        'last_modified': modified_at,
        'created': created_at,
        'content': None,
        'format': None,
        'mimetype': None,
    }
    try:
        writable = os.access(os_path, os.W_OK)
    except OSError:
        self.log.error("Failed to check write permissions on %s", os_path)
        writable = False
    model['writable'] = writable
    return model
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _dir_model(self, path, content=True):
    """Build a model for a directory

    if content is requested, will include a listing of the directory

    Parameters
    ----------
    path : string
        API path of the directory.
    content : bool
        When true, ``model['content']`` is a list of content-less models
        (obtained through ``self.get``) and ``model['format']`` is 'json'.

    Raises
    ------
    web.HTTPError
        404 when the path is not a directory, or is hidden.
    """
    os_path = self._get_os_path(path)

    four_o_four = u'directory does not exist: %r' % path

    if not os.path.isdir(os_path):
        raise web.HTTPError(404, four_o_four)
    elif is_hidden(os_path, self.root_dir):
        self.log.info("Refusing to serve hidden directory %r, via 404 Error",
            os_path
        )
        raise web.HTTPError(404, four_o_four)

    model = self._base_model(path)
    model['type'] = 'directory'
    if content:
        model['content'] = contents = []
        for name in os.listdir(os_path):
            entry_path = os.path.join(os_path, name)
            # skip over broken symlinks in listing
            if not os.path.exists(entry_path):
                # Logger.warn is a deprecated alias; use warning()
                self.log.warning("%s doesn't exist", entry_path)
                continue
            elif not os.path.isfile(entry_path) and not os.path.isdir(entry_path):
                self.log.debug("%s not a regular file", entry_path)
                continue
            if self.should_list(name) and not is_hidden(entry_path, self.root_dir):
                contents.append(self.get(
                    path='%s/%s' % (path, name),
                    content=False)
                )

        model['format'] = 'json'

    return model
|
|
|
|
|
2014-11-12 06:20:56 +08:00
|
|
|
def _file_model(self, path, content=True, format=None):
|
2014-06-03 04:47:11 +08:00
|
|
|
"""Build a model for a file
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-06-03 04:47:11 +08:00
|
|
|
if content is requested, include the file contents.
|
2014-11-12 06:20:56 +08:00
|
|
|
|
|
|
|
format:
|
|
|
|
If 'text', the contents will be decoded as UTF-8.
|
|
|
|
If 'base64', the raw bytes contents will be encoded as base64.
|
|
|
|
If not specified, try to decode as UTF-8, and fall back to base64
|
2014-06-03 04:47:11 +08:00
|
|
|
"""
|
2014-10-23 04:13:36 +08:00
|
|
|
model = self._base_model(path)
|
2014-06-03 04:47:11 +08:00
|
|
|
model['type'] = 'file'
|
2014-11-06 08:11:29 +08:00
|
|
|
|
|
|
|
os_path = self._get_os_path(path)
|
|
|
|
model['mimetype'] = mimetypes.guess_type(os_path)[0] or 'text/plain'
|
|
|
|
|
2014-06-03 04:47:11 +08:00
|
|
|
if content:
|
2014-11-11 05:46:51 +08:00
|
|
|
if not os.path.isfile(os_path):
|
|
|
|
# could be FIFO
|
|
|
|
raise web.HTTPError(400, "Cannot get content of non-file %s" % os_path)
|
2014-11-12 09:18:55 +08:00
|
|
|
with self.open(os_path, 'rb') as f:
|
2014-07-30 05:01:27 +08:00
|
|
|
bcontent = f.read()
|
2014-11-12 06:20:56 +08:00
|
|
|
|
|
|
|
if format != 'base64':
|
|
|
|
try:
|
|
|
|
model['content'] = bcontent.decode('utf8')
|
|
|
|
except UnicodeError as e:
|
|
|
|
if format == 'text':
|
|
|
|
raise web.HTTPError(400, "%s is not UTF-8 encoded" % path)
|
|
|
|
else:
|
|
|
|
model['format'] = 'text'
|
|
|
|
|
|
|
|
if model['content'] is None:
|
2014-07-30 05:01:27 +08:00
|
|
|
model['content'] = base64.encodestring(bcontent).decode('ascii')
|
|
|
|
model['format'] = 'base64'
|
2014-11-12 06:20:56 +08:00
|
|
|
|
2014-06-03 04:47:11 +08:00
|
|
|
return model
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-06-03 04:47:11 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _notebook_model(self, path, content=True):
    """Build a model for a notebook.

    When content is requested the notebook is read with nbformat (as
    version 4), its cells are passed to ``mark_trusted_cells``, and the
    notebook object itself (not a serialized string) is stored under
    'content' with format 'json'; the model is then validated.

    Raises web.HTTPError(400) if nbformat cannot read the file.
    """
    model = self._base_model(path)
    model['type'] = 'notebook'
    if not content:
        return model

    os_path = self._get_os_path(path)
    with self.open(os_path, 'r', encoding='utf-8') as stream:
        try:
            notebook = nbformat.read(stream, as_version=4)
        except Exception as e:
            raise web.HTTPError(400, u"Unreadable Notebook: %s %r" % (os_path, e))
    self.mark_trusted_cells(notebook, path)
    model['content'] = notebook
    model['format'] = 'json'
    self.validate_notebook_model(model)
    return model
|
2013-08-27 02:18:34 +08:00
|
|
|
|
2014-11-12 06:51:21 +08:00
|
|
|
def get(self, path, content=True, type_=None, format=None):
    """ Takes a path for an entity and returns its model

    Parameters
    ----------
    path : str
        the API path that describes the relative path for the target
    content : bool
        Whether to include the contents in the reply
    type_ : str, optional
        The requested type - 'file', 'notebook', or 'directory'.
        Will raise HTTPError 400 if the content doesn't match.
    format : str, optional
        The requested format for file contents. 'text' or 'base64'.
        Ignored if this returns a notebook or directory model.

    Returns
    -------
    model : dict
        the contents model. If content=True, returns the contents
        of the file or directory as well.

    Raises
    ------
    web.HTTPError
        404 when nothing exists at ``path``; 400 when ``type_`` disagrees
        with what is on disk (directory vs. non-directory).
    """
    path = path.strip('/')

    if not self.exists(path):
        raise web.HTTPError(404, u'No such file or directory: %s' % path)

    os_path = self._get_os_path(path)
    if os.path.isdir(os_path):
        if type_ not in (None, 'directory'):
            raise web.HTTPError(400,
                u'%s is a directory, not a %s' % (path, type_))
        model = self._dir_model(path, content=content)
    elif type_ == 'notebook' or (type_ is None and path.endswith('.ipynb')):
        model = self._notebook_model(path, content=content)
    else:
        if type_ == 'directory':
            # interpolate the path: the template used to be sent unformatted
            raise web.HTTPError(400,
                u'%s is not a directory' % path)
        model = self._file_model(path, content=content, format=format)
    return model
|
2013-07-13 00:15:08 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _save_notebook(self, os_path, model, path=''):
    """Write the notebook held in ``model['content']`` to ``os_path``.

    The content dict is converted with nbformat.from_dict, passed to
    ``check_and_sign`` together with the API ``path``, and then written
    as UTF-8 through ``self.atomic_writing`` without version conversion.
    """
    notebook = nbformat.from_dict(model['content'])
    self.check_and_sign(notebook, path)
    # Save the notebook file
    with self.atomic_writing(os_path, encoding='utf-8') as stream:
        nbformat.write(notebook, stream, version=nbformat.NO_CONVERT)
|
2014-06-04 02:35:45 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _save_file(self, os_path, model, path=''):
|
2014-06-17 03:47:00 +08:00
|
|
|
"""save a non-notebook file"""
|
2014-06-04 02:35:45 +08:00
|
|
|
fmt = model.get('format', None)
|
|
|
|
if fmt not in {'text', 'base64'}:
|
|
|
|
raise web.HTTPError(400, "Must specify format of file contents as 'text' or 'base64'")
|
|
|
|
try:
|
|
|
|
content = model['content']
|
|
|
|
if fmt == 'text':
|
|
|
|
bcontent = content.encode('utf8')
|
|
|
|
else:
|
|
|
|
b64_bytes = content.encode('ascii')
|
|
|
|
bcontent = base64.decodestring(b64_bytes)
|
|
|
|
except Exception as e:
|
|
|
|
raise web.HTTPError(400, u'Encoding error saving %s: %s' % (os_path, e))
|
2014-11-19 05:02:00 +08:00
|
|
|
with self.atomic_writing(os_path, text=False) as f:
|
2014-06-04 02:35:45 +08:00
|
|
|
f.write(bcontent)
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def _save_directory(self, os_path, model, path=''):
    """Create the directory ``os_path`` unless it is already there.

    Raises web.HTTPError(400) when the path is hidden, or when it exists
    but is not a directory. An existing directory is only logged.
    """
    if is_hidden(os_path, self.root_dir):
        raise web.HTTPError(400, u'Cannot create hidden directory %r' % os_path)

    if os.path.exists(os_path):
        if os.path.isdir(os_path):
            self.log.debug("Directory %r already exists", os_path)
        else:
            raise web.HTTPError(400, u'Not a directory: %s' % (os_path))
    else:
        with self.perm_to_403():
            os.mkdir(os_path)
|
2014-06-04 02:35:45 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def save(self, model, path=''):
    """Persist ``model`` at ``path`` and return its content-less model.

    Dispatches on ``model['type']`` to the notebook, file or directory
    saver. Before writing, a checkpoint is created if the target file
    exists and has none. For notebooks, a validation message left on the
    model by ``validate_notebook_model`` is copied onto the returned model.

    Raises web.HTTPError: 400 for a missing type, missing content or
    unknown type; 500 for any unexpected error while saving.
    """
    path = path.strip('/')

    if 'type' not in model:
        raise web.HTTPError(400, u'No file type provided')
    if model['type'] != 'directory' if 'content' not in model else False:
        raise web.HTTPError(400, u'No file content provided')

    # One checkpoint should always exist
    if self.file_exists(path) and not self.list_checkpoints(path):
        self.create_checkpoint(path)

    os_path = self._get_os_path(path)
    self.log.debug("Saving %s", os_path)
    try:
        kind = model['type']
        if kind == 'notebook':
            self._save_notebook(os_path, model, path)
        elif kind == 'file':
            self._save_file(os_path, model, path)
        elif kind == 'directory':
            self._save_directory(os_path, model, path)
        else:
            raise web.HTTPError(400, "Unhandled contents type: %s" % model['type'])
    except web.HTTPError:
        # already an HTTP error: pass it through untouched
        raise
    except Exception as e:
        self.log.error(u'Error while saving file: %s %s', path, e, exc_info=True)
        raise web.HTTPError(500, u'Unexpected error while saving file: %s %s' % (path, e))

    if model['type'] == 'notebook':
        self.validate_notebook_model(model)
        validation_message = model.get('message', None)
    else:
        validation_message = None

    saved = self.get(path, content=False)
    if validation_message:
        saved['message'] = validation_message
    return saved
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def update(self, model, path):
    """Apply a partial update to the file at ``path``.

    For use in PATCH requests, to enable renaming a file without
    re-uploading its contents. Only renaming is handled: if the model
    carries a different 'path', the file is renamed to it. Returns the
    content-less model of the (possibly renamed) file.
    """
    current = path.strip('/')
    target = model.get('path', current).strip('/')
    if target != current:
        self.rename(current, target)
    return self.get(target, content=False)
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def delete(self, path):
    """Delete the file or directory at ``path`` along with its checkpoints.

    Raises web.HTTPError: 400 for a directory that contains anything other
    than the checkpoint directory, 404 when the path is neither a
    directory nor a regular file.
    """
    path = path.strip('/')
    os_path = self._get_os_path(path)
    if os.path.isdir(os_path):
        entries = os.listdir(os_path)
        # don't delete non-empty directories (checkpoints dir doesn't count)
        if entries and entries != [self.checkpoint_dir]:
            raise web.HTTPError(400, u'Directory %s not empty' % os_path)
    elif not os.path.isfile(os_path):
        raise web.HTTPError(404, u'File does not exist: %s' % os_path)

    # clear checkpoints
    for checkpoint in self.list_checkpoints(path):
        cp_path = self.get_checkpoint_path(checkpoint['id'], path)
        if not os.path.isfile(cp_path):
            continue
        self.log.debug("Unlinking checkpoint %s", cp_path)
        with self.perm_to_403():
            os.unlink(cp_path)

    if os.path.isdir(os_path):
        self.log.debug("Removing directory %s", os_path)
        remove = shutil.rmtree
    else:
        self.log.debug("Unlinking file %s", os_path)
        remove = os.unlink
    with self.perm_to_403():
        remove(os_path)
|
2011-08-05 04:55:04 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def rename(self, old_path, new_path):
    """Move a file from ``old_path`` to ``new_path`` with its checkpoints.

    Does nothing when both API paths are equal after stripping slashes.

    Raises web.HTTPError: 409 when the destination already exists, 500
    for any unexpected error while moving the file.
    """
    old_path = old_path.strip('/')
    new_path = new_path.strip('/')
    if new_path == old_path:
        return

    destination = self._get_os_path(new_path)
    source = self._get_os_path(old_path)

    # Should we proceed with the move?
    if os.path.exists(destination):
        raise web.HTTPError(409, u'File already exists: %s' % new_path)

    # Move the file
    try:
        with self.perm_to_403():
            shutil.move(source, destination)
    except web.HTTPError:
        # already an HTTP error: pass it through untouched
        raise
    except Exception as e:
        raise web.HTTPError(500, u'Unknown error renaming file: %s %s' % (old_path, e))

    # Move the checkpoints
    for checkpoint in self.list_checkpoints(old_path):
        cp_id = checkpoint['id']
        cp_source = self.get_checkpoint_path(cp_id, old_path)
        cp_destination = self.get_checkpoint_path(cp_id, new_path)
        if not os.path.isfile(cp_source):
            continue
        self.log.debug("Renaming checkpoint %s -> %s", cp_source, cp_destination)
        with self.perm_to_403():
            shutil.move(cp_source, cp_destination)
|
2013-08-27 02:18:34 +08:00
|
|
|
|
2013-04-10 04:49:10 +08:00
|
|
|
# Checkpoint-related utilities
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def get_checkpoint_path(self, checkpoint_id, path):
    """Return the OS path of checkpoint ``checkpoint_id`` for ``path``.

    The checkpoint file sits in ``self.checkpoint_dir`` beside the target
    and is named ``<basename>-<checkpoint_id><ext>``. The checkpoint
    directory is passed to ``ensure_dir_exists`` as a side effect.
    """
    parent, _, name = path.strip('/').rpartition('/')
    parent = parent.strip('/')
    stem, extension = os.path.splitext(name)
    filename = u"{name}-{checkpoint_id}{ext}".format(
        name=stem,
        checkpoint_id=checkpoint_id,
        ext=extension,
    )
    cp_dir = os.path.join(self._get_os_path(path=parent), self.checkpoint_dir)
    with self.perm_to_403():
        ensure_dir_exists(cp_dir)
    return os.path.join(cp_dir, filename)
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def get_checkpoint_model(self, checkpoint_id, path):
    """Build the info dict for one checkpoint.

    Returns a dict with 'id' (the checkpoint id as given) and
    'last_modified' (the checkpoint file's mtime converted with
    ``tz.utcfromtimestamp``).
    """
    api_path = path.strip('/')
    cp_path = self.get_checkpoint_path(checkpoint_id, api_path)
    mtime = os.stat(cp_path).st_mtime
    return {
        'id': checkpoint_id,
        'last_modified': tz.utcfromtimestamp(mtime),
    }
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2013-04-10 04:49:10 +08:00
|
|
|
# public checkpoint API
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def create_checkpoint(self, path):
    """Snapshot the current state of the file at ``path``.

    The file is copied to its checkpoint location under the single
    checkpoint id "checkpoint"; returns that checkpoint's info dict.

    Raises web.HTTPError(404) when ``path`` is not an existing file.
    """
    path = path.strip('/')
    if not self.file_exists(path):
        raise web.HTTPError(404)
    source = self._get_os_path(path)
    # only the one checkpoint ID:
    checkpoint_id = u"checkpoint"
    destination = self.get_checkpoint_path(checkpoint_id, path)
    self.log.debug("creating checkpoint for %s", path)
    with self.perm_to_403():
        self._copy(source, destination)

    # return the checkpoint info
    return self.get_checkpoint_model(checkpoint_id, path)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def list_checkpoints(self, path):
    """Return the checkpoints that exist for the file at ``path``.

    This contents manager currently only supports one checkpoint per file,
    so the result is either an empty list or a one-element list holding
    the info dict of the "checkpoint" checkpoint.
    """
    path = path.strip('/')
    checkpoint_id = "checkpoint"
    cp_path = self.get_checkpoint_path(checkpoint_id, path)
    if os.path.exists(cp_path):
        return [self.get_checkpoint_model(checkpoint_id, path)]
    return []
|
2014-05-31 03:39:11 +08:00
|
|
|
|
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def restore_checkpoint(self, checkpoint_id, path):
    """Overwrite the file at ``path`` with its checkpoint ``checkpoint_id``.

    A checkpoint whose path ends in '.ipynb' is first read with nbformat,
    so an unreadable notebook checkpoint is never restored.

    Raises web.HTTPError(404) when the checkpoint file does not exist.
    """
    path = path.strip('/')
    self.log.info("restoring %s from checkpoint %s", path, checkpoint_id)
    target = self._get_os_path(path)
    cp_path = self.get_checkpoint_path(checkpoint_id, path)
    if not os.path.isfile(cp_path):
        self.log.debug("checkpoint file does not exist: %s", cp_path)
        message = u'checkpoint does not exist: %s@%s' % (path, checkpoint_id)
        raise web.HTTPError(404, message)
    # ensure notebook is readable (never restore from an unreadable notebook)
    if cp_path.endswith('.ipynb'):
        with self.open(cp_path, 'r', encoding='utf-8') as stream:
            nbformat.read(stream, as_version=4)
    self.log.debug("copying %s -> %s", cp_path, target)
    with self.perm_to_403():
        self._copy(cp_path, target)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def delete_checkpoint(self, checkpoint_id, path):
    """delete a file's checkpoint

    Parameters
    ----------
    checkpoint_id : string
        Id of the checkpoint to remove.
    path : string
        API path of the file the checkpoint belongs to.

    Raises
    ------
    web.HTTPError
        404 when the checkpoint file does not exist; 403 (through
        ``perm_to_403``) when removing it fails with a permission error.
    """
    path = path.strip('/')
    cp_path = self.get_checkpoint_path(checkpoint_id, path)
    if not os.path.isfile(cp_path):
        raise web.HTTPError(404,
            u'Checkpoint does not exist: %s@%s' % (path, checkpoint_id)
        )
    self.log.debug("unlinking %s", cp_path)
    # report permission failures as 403, the same way delete() does
    with self.perm_to_403():
        os.unlink(cp_path)
|
2014-05-31 03:39:11 +08:00
|
|
|
|
2013-03-25 01:53:59 +08:00
|
|
|
def info_string(self):
    """Return a one-line description naming the directory being served."""
    template = "Serving notebooks from local directory: %s"
    return template % self.root_dir
|
2014-03-30 05:39:15 +08:00
|
|
|
|
2014-10-23 04:13:36 +08:00
|
|
|
def get_kernel_path(self, path, model=None):
    """Return the initial working dir a kernel associated with a given notebook

    This is the OS path of the directory part of ``path`` (everything
    before the last '/'), or of the empty API path when ``path`` has no
    '/'. ``model`` is accepted but not used.
    """
    parent_dir = path.rpartition('/')[0]
    return self._get_os_path(parent_dir)
|