# Source code for pfio.cache.sparse_file

'''
A cache system for remote file systems that stores the cached data locally
as a sparse file.

The cache is, of course, read-only.
'''

import fcntl
import io
import os
import shutil
import struct
import tempfile
from contextlib import contextmanager
from dataclasses import dataclass
from types import TracebackType
from typing import Optional, Tuple

from .file_cache import DummyLock, RWLock


@dataclass(frozen=True)
class _Range:
    '''A half-open byte range ``[start, start + length)`` of the wrapped file.

    ``cached`` records whether the bytes of the range are already stored
    in the local cache file.
    '''
    start: int
    length: int
    cached: bool = False

    @staticmethod
    def size():
        '''Return the size in bytes of one packed entry (see ``pack()``).'''
        return struct.calcsize('QLL')

    def overlap(self, rhs) -> bool:
        '''Return ``True`` if the two ranges intersect.

        Ranges that merely touch at an end point do not overlap.
        '''
        # The product is negative only when self.start < rhs.right and
        # rhs.start < self.right hold at the same time.
        return (self.start - rhs.right) * (self.right - rhs.start) < 0

    @property
    def right(self):
        '''Exclusive end offset of the range (``start + length``).'''
        return self.start + self.length

    def includes(self, rhs) -> bool:
        '''Return ``True`` if ``rhs`` lies entirely within this range.'''
        return (self.start <= rhs.start) and (rhs.right <= self.right)

    def merge(self, rhs):
        '''Return the smallest range that covers both ``self`` and ``rhs``.

        Both ranges must overlap and must have the same ``cached`` state.
        '''
        assert self.overlap(rhs)
        assert self.cached == rhs.cached
        start = min(self.start, rhs.start)
        right = max(self.right, rhs.right)
        # The second field of _Range is a length, not an end offset.
        return _Range(start, right - start, cached=self.cached)

    def pack(self):
        '''Serialize the range as ``(start, cached, length)``.'''
        # Q: unsigned long long, L: unsigned long.
        # The format has no byte-order prefix, so native sizes and
        # alignment apply and the entry width is platform dependent
        # (24 bytes where a C unsigned long is 8 bytes, 16 bytes where it
        # is 4).  Always use size() instead of a hard-coded width.
        # Upper bytes of ``cached`` are reserved for some other usage, maybe
        return struct.pack('QLL', self.start, self.cached, self.length)

    @staticmethod
    def unpack(buf):
        '''Rebuild a range from a buffer produced by ``pack()``.'''
        (s, c, l) = struct.unpack('QLL', buf)
        return _Range(start=s, cached=bool(c), length=l)


class _CachedWrapperBase:
    '''Base class of the transparent, read-only local caches for remote files.

    The wrapper presents a seekable, read-only file-like interface on top
    of ``fileobj`` and owns a local cache file created under ``cachedir``.
    This base class provides the shared bookkeeping (current position,
    locking, cache file lifetime); ``read()`` is provided by subclasses.

    Arguments:

        fileobj: The wrapped file object.  This class calls ``seek()``
            and, when ``close_on_close`` is set, ``close()`` on it.

        size (int): Total size of ``fileobj`` in bytes; must be positive.

        cachedir (str): Directory in which the cache file is created.
            Defaults to ``$XDG_CACHE_HOME/pfio``, or ``$HOME/.cache/pfio``
            when ``XDG_CACHE_HOME`` is not set.

        close_on_close (bool): If ``True``, ``fileobj`` is closed
            together with the wrapper.

        cache_size_limit (int): Stored as an attribute; this base class
            does not enforce it by itself.

        multithread_safe (bool): If ``True`` an ``RWLock`` guards the
            wrapper state, otherwise a ``DummyLock`` is used.
    '''

    def __init__(self, fileobj, size, cachedir=None, close_on_close=False,
                 cache_size_limit=None, multithread_safe=False):
        self.fileobj = fileobj
        self.cachedir = cachedir
        self.cache_size_limit = cache_size_limit

        self.multithread_safe = multithread_safe
        if self.multithread_safe:
            self.lock = RWLock()
        else:
            self.lock = DummyLock()

        self.pos = 0
        self.size = size
        assert size > 0
        if cachedir is None:
            basedir = os.getenv('XDG_CACHE_HOME')
            if basedir is None:
                home = os.getenv('HOME')
                if home is None:
                    # HOME can be unset (daemons, minimal containers);
                    # joining None would raise TypeError, so ask the OS.
                    home = os.path.expanduser('~')
                basedir = os.path.join(home, ".cache")
            self.cachedir = os.path.join(basedir, "pfio")
        os.makedirs(self.cachedir, exist_ok=True)
        # delete=True: the cache file disappears when it is closed.
        self.cachefp = tempfile.NamedTemporaryFile(delete=True,
                                                   dir=self.cachedir)

        # TODO: make this tree if the size gets too long for O(n) scan
        self.ranges = [_Range(0, size)]
        self._closed = False
        self._frozen = False
        self.close_on_close = close_on_close

    def close(self):
        '''Close the cache file and, if requested, the wrapped file.

        Calling it more than once is harmless.
        '''
        with self.lock.wrlock():
            if not self._closed:
                self._closed = True
                self.cachefp.close()
                if self.close_on_close:
                    self.fileobj.close()

    def preserve(self, dest):
        '''Keep the current cache file at ``dest`` and freeze the cache.

        The cache file is hard-linked to ``dest``; if linking fails with
        ``OSError`` it is copied instead.  Afterwards the wrapper reads
        the cache from ``dest`` (opened read-only) and is marked frozen.
        '''
        with self.lock.wrlock():
            old_fp = self.cachefp
            try:
                # Hard link and save them
                os.link(old_fp.name, dest)
            except OSError:
                # TODO: check errno to make sure handling the
                # 'different-drive' error.
                shutil.copyfile(old_fp.name, dest)

            # Open the preserved file first so that a failure here leaves
            # the wrapper with its original, still usable cache file.
            new_fp = open(dest, 'rb')
            # Release the old handle on both paths; previously the copy
            # fallback left it to the garbage collector.
            old_fp.close()
            self.cachefp = new_fp
            self._frozen = True

    def readline(self):
        '''Line-oriented reading is not supported.'''
        raise NotImplementedError()

    def __enter__(self):
        return self

    def __exit__(self, exc_type: Optional[BaseException],
                 exc_value: Optional[BaseException],
                 traceback: Optional[TracebackType]):
        self.close()

    def flush(self):
        '''No-op; the wrapper is read-only.'''
        pass

    @property
    def closed(self):
        '''``True`` once ``close()`` has been called.'''
        return self._closed

    def isatty(self):
        return False

    def readable(self):
        return True

    def seekable(self):
        return True

    def tell(self):
        '''Return the current read position.'''
        return self.pos

    def truncate(self, size=None):
        raise io.UnsupportedOperation('truncate')

    def seek(self, pos, whence=io.SEEK_SET):
        '''Move the read position and return the new absolute position.

        Raises ``OSError`` (errno 22) if the resulting position is
        negative and ``ValueError`` for an unknown ``whence``.
        '''
        with self.lock.wrlock():
            return self._seek(pos, whence)

    def _seek(self, pos, whence):
        '''Lock-free implementation of ``seek()``.'''
        if whence == io.SEEK_SET:
            pass
        elif whence == io.SEEK_CUR:
            pos += self.pos
        elif whence == io.SEEK_END:
            pos += self.size
        else:
            raise ValueError('Wrong whence value: {}'.format(whence))

        if pos < 0:
            raise OSError(22, "[Errno 22] Invalid argument")
        self.pos = pos
        # Keep the wrapped file positioned in step with the wrapper.
        self.fileobj.seek(self.pos, io.SEEK_SET)
        return self.pos

    def writable(self):
        return False

    def write(self, data):
        raise io.UnsupportedOperation('not writable')

    def readall(self):
        '''Read from the current position to the end of the file.'''
        return self.read(-1)

    def readinto(self, b):
        '''Read up to ``len(b)`` bytes into ``b``; return the count read.'''
        buf = self.read(len(b))
        b[:len(buf)] = buf
        return len(buf)

    def _read_all_cache(self):
        '''Yield ``(data, range)`` for every range in ``self.ranges``.

        ``data`` is the content read from the cache file for cached
        ranges and ``None`` for ranges that are not cached.
        '''
        for r in self.ranges:
            if r.cached:
                data = os.pread(self.cachefp.fileno(), r.length, r.start)
                yield data, r
            else:
                yield None, r


class DynamicCachedWrapper(_CachedWrapperBase):
    '''Dynamic-page based local cache wrapper

    Instead of fixed-size pages, ``self.ranges`` is split exactly at the
    offsets that were requested: every read fetches the not-yet-cached
    parts of the requested range from ``fileobj``, stores them in the
    cache file and marks them as cached.  Adjacent cached ranges are
    merged again after each read.

    ``cache_size_limit`` is not consulted by this class.
    '''

    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)

    def read(self, size=-1) -> bytes:
        '''Read up to ``size`` bytes from the current position.

        A negative (or ``None``) ``size`` reads up to the end of the file.
        The request is clamped to the bytes remaining, so a read that
        crosses the end of the file returns only the available bytes and
        a read at or past the end returns ``b''``.

        Raises ``RuntimeError`` if the wrapper is closed.
        '''
        with self.lock.wrlock():
            if self._closed:
                raise RuntimeError("closed")

            # Clamp to the remaining bytes.  Without this the result was
            # zero-padded past EOF and the position arithmetic below went
            # wrong; after seeking past EOF the size even became negative.
            remaining = max(self.size - self.pos, 0)
            if size is None or size < 0 or size > remaining:
                size = remaining
            if size == 0:
                return b''

            buf = bytearray(size)
            offset = 0
            # TODO: unnecessary copy; optimize with os.readv?
            # _read() must be consumed completely: it installs the
            # updated range list only when it is exhausted.
            for data in self._read(size):
                buf[offset:offset+len(data)] = data
                offset += len(data)

            self.pos += len(buf)
            # NOTE(review): this rewinds the position to 0 once the end of
            # the file is reached, so tell() never reports ``size``.  Kept
            # as-is because the sibling wrappers behave the same way;
            # confirm whether this is intended.
            self.pos %= self.size
            if self.pos != self.fileobj.tell():
                self.fileobj.seek(self.pos, io.SEEK_SET)
            return bytes(buf)

    def _read(self, size):
        '''Yield the data chunks of the requested range in file order.

        While iterating, the range list is rebuilt: runs of consecutive
        cached ranges are merged into one, zero-length ranges are dropped.
        ``self.ranges`` is replaced once the generator is exhausted.
        '''
        new_ranges = []
        streak = []  # consecutive cached ranges waiting to be merged
        for data, r in self._read2(size):
            if r.length > 0:
                if r.cached:
                    streak.append(r)
                else:
                    if streak:
                        start = streak[0].start
                        length = sum(s.length for s in streak)
                        new_ranges.append(_Range(start, length, cached=True))
                        streak = []
                    new_ranges.append(r)

            if data is not None:
                yield data

        if streak:
            start = streak[0].start
            length = sum(s.length for s in streak)
            new_ranges.append(_Range(start, length, cached=True))

        self.ranges = new_ranges

    def _read2(self, size):
        '''Walk ``self.ranges`` and yield ``(data, range)`` pairs.

        ``data`` is ``None`` for ranges (or parts of ranges) outside the
        request ``[self.pos, self.pos + size)``; for the parts inside the
        request it is the content, read from the cache or fetched from
        ``fileobj``.  Existing ranges are split at the request boundaries.
        '''
        # r0 is the part of the request that has not been served yet.
        r0 = _Range(self.pos, size)
        for r1 in self.ranges:
            if not r1.overlap(r0):
                yield None, r1
                continue

            # [r0 [ ... r1] never happens as the first r1 always starts with 0
            assert r1.start <= r0.start

            # [r1 [ r0 ] ] r1 cached; prevent unnecessary area split
            if r1.includes(r0) and r1.cached:
                data = os.pread(self.cachefp.fileno(), r0.length, r0.start)
                yield data, r1
                continue

            # Leading part of r1 that precedes the request (may be empty).
            yield None, _Range(r1.start, r0.start - r1.start, r1.cached)

            # [ r1 [ r0 ] ]
            if r0.right < r1.right:
                yield self._get_range(_Range(r0.start, r0.length, r1.cached))
                # Trailing part of r1 that follows the request.
                yield None, _Range(r0.right, r1.right - r0.right, r1.cached)
                continue

            # [ r1 [ ] r0 ]
            yield self._get_range(_Range(r0.start, r1.right - r0.start,
                                         r1.cached))

            # Continue with what is left of the request after r1.
            r0 = _Range(r1.right, r0.right - r1.right)

    def _get_range(self, r: _Range) -> Tuple[bytes, _Range]:
        '''Return ``(data, range)`` for ``r``, fetching it if not cached.

        A cached range is read from the cache file.  Otherwise the data
        is read from ``fileobj``, written into the cache file at the same
        offset and returned together with a range marked as cached.
        '''
        if r.cached:
            return os.pread(self.cachefp.fileno(), r.length, r.start), r

        # A frozen (preserved) cache must not be written to any more.
        assert not self._frozen
        self.fileobj.seek(r.start, io.SEEK_SET)
        data = self.fileobj.read(r.length)
        written = os.pwrite(self.cachefp.fileno(), data, r.start)
        if written < 0:
            raise RuntimeError("bad file descriptor")
        return data, _Range(r.start, r.length, True)



# [docs]
class CachedWrapper(_CachedWrapperBase):
    '''A page-based transparent local cache for remote files

    This wrapper makes a transparent read-only local cache as sparse
    file.  The local cache behaves as read-mirror of remote file -
    when a known range is requested, it'll be local read. If it's not
    locally cached, it fetches the range and stores as local file.

    Example usage follows:

    .. code-block::

        from pfio.v2 import from_url
        from pfio.cache import SparseFileCache

        with from_url("s3://bucket/path-prefix/") as s3:
          large_file = "path/to/large/file"
          stat = s3.stat(large_file)
          with SparseFileCache(s3.open(large_file), stat.size,
                               close_on_close=True) as fp:
            fp.seek(1024)
            # Read file from 1024 to 1024+65536 and cache it
            data = fp.read(65536)


    It is internally used behind ZIP fs:

    .. code-block::

        from pfio.v2 import from_url

        with from_url("s3://bucket/your.zip", local_cache=True) as fs:
          with fs.open("file-in-zip.jpg", 'rb') as fp:
            data = fp.read()

    Arguments:

        fileobj: The wrapped (remote) file object.

        size (int): Total size of ``fileobj`` in bytes.

        cachedir (str): Directory in which the cache file is created.

        close_on_close (bool): If ``True``, ``fileobj`` is closed
            together with the wrapper.

        pagesize (int): Size in bytes of one cache page; data is always
            fetched and cached in whole pages.  Must be positive.

        multithread_safe (bool): Defines multithread safety. If this
            is ``True``, reader-writer locking system based on
            ``threading.Lock`` is introduced behind the cache
            management.

        cache_size_limit (int): Soft limit of the amount of cached data
            in bytes. It is checked after each read; once the amount of
            cached data reaches this value, the whole cache is discarded
            and caching starts over. The default value is ``None`` to
            indicate that no limit.

    '''

    def __init__(self, fileobj, size, cachedir=None, close_on_close=False,
                 pagesize=16*1024*1024, multithread_safe=False,
                 cache_size_limit=None):
        super().__init__(fileobj, size, cachedir, close_on_close,
                         cache_size_limit=cache_size_limit,
                         multithread_safe=multithread_safe)
        assert pagesize > 0
        self.pagesize = pagesize
        self.size = size
        self._init_ranges()

    def _init_ranges(self):
        '''Reset the page table: every page uncached, ``cache_size`` zero.'''
        self.cache_size = 0
        pagecount = self.size // self.pagesize
        self.ranges = [_Range(i * self.pagesize, self.pagesize, cached=False)
                       for i in range(pagecount)]

        # The last page is shorter when size is not a pagesize multiple.
        remain = self.size % self.pagesize
        if remain > 0:
            r = _Range(pagecount*self.pagesize, remain, cached=False)
            self.ranges.append(r)

    def read(self, size=-1) -> bytes:
        '''Read up to ``size`` bytes from the current position.

        A negative (or ``None``) ``size`` reads up to the end of the
        file; a read at or past the end returns ``b''``.  Raises
        ``RuntimeError`` if the wrapper is closed.
        '''
        with self.lock.wrlock():
            # TODO: if this giant lock becomes the bottleneck, split
            # this lock into per-page locks
            return self._read(size)

    def _is_full(self) -> bool:
        '''Return ``True`` if the cached amount reached the size limit.'''
        if self.cache_size_limit is None:
            return False
        return self.cache_size >= self.cache_size_limit

    def _read(self, size) -> bytes:
        '''Lock-free implementation of ``read()``.'''
        if self._closed:
            raise RuntimeError("closed")

        # Clamp to the remaining bytes.  After a seek past EOF the
        # remaining amount would be negative, which used to end in a
        # negative read length or an out-of-range page index.
        remaining = max(self.size - self.pos, 0)
        if size is None or size < 0 or remaining < size:
            size = remaining
        if size == 0:
            return b''

        # Pages [start, end) cover the requested byte range.
        start = self.pos // self.pagesize
        end = (self.pos + size) // self.pagesize
        if (self.pos + size) % self.pagesize != 0:
            end += 1

        for i in range(start, end):
            r = self.ranges[i]

            if not r.cached:
                # A frozen (preserved) cache must not be written to.
                assert not self._frozen
                self.fileobj.seek(r.start, io.SEEK_SET)
                data = self.fileobj.read(r.length)
                n = os.pwrite(self.cachefp.fileno(), data, r.start)
                if n < 0:
                    raise RuntimeError("bad file descriptor")

                # Account for the stored bytes; without this the size
                # limit could never be reached.
                self.cache_size += n
                self.ranges[i] = _Range(r.start, r.length, cached=True)

        buf = os.pread(self.cachefp.fileno(), size, self.pos)

        self.pos += len(buf)
        # NOTE(review): this rewinds the position to 0 once the end of
        # the file is reached, so tell() never reports ``size``; confirm
        # whether this is intended.
        self.pos %= self.size
        if self.pos != self.fileobj.tell():
            self.fileobj.seek(self.pos, io.SEEK_SET)

        # cache_size_limit is a soft limit: the data of this read has
        # already been served, now drop the whole cache and start over.
        if self._is_full():
            os.truncate(self.cachefp.fileno(), 0)
            self._init_ranges()

        return buf



@contextmanager
def _shflock(fd):
    '''Hold a shared ``flock`` on ``fd`` for the duration of the ``with`` body.

    The lock is released when the body is left, normally or by exception.
    '''
    acquire, release = fcntl.LOCK_SH, fcntl.LOCK_UN
    fcntl.flock(fd, acquire)
    try:
        yield
    finally:
        fcntl.flock(fd, release)


@contextmanager
def _exflock(fd):
    '''Hold an exclusive ``flock`` on ``fd`` for the ``with`` body.

    The lock is released when the body is left, normally or by exception.
    '''
    acquire, release = fcntl.LOCK_EX, fcntl.LOCK_UN
    fcntl.flock(fd, acquire)
    try:
        yield
    finally:
        fcntl.flock(fd, release)



# [docs]
class MPCachedWrapper(CachedWrapper):
    '''Multiprocessing version of cached wrapper

    The page table is kept in an index file next to the cache file and
    every access to it is guarded with ``flock`` on the index file, so
    that wrappers opened on the same pair of files can share the cache.

    It is internally used behind ZIP fs for multiprocessing:

    .. code-block::

        import os
        from pfio.v2 import from_url

        with from_url("s3://bucket/your.zip", local_cache=True) as fs:
          pid = os.fork()
          if pid:
            os.wait()
          else:
            with fs.open("file-in-zip.jpg", 'rb') as fp:
              data = fp.read()

    Arguments:

        fileobj: The wrapped (remote) file object.

        size (int): Total size of ``fileobj`` in bytes.

        cachedir (str): Directory in which new cache and index files are
            created.

        close_on_close (bool): If ``True``, ``fileobj`` is closed
            together with the wrapper.

        cache_size_limit (int): Soft limit of the disk space used by the
            cache file in bytes. Once it is reached the whole cache is
            discarded. ``None`` means no limit.

        pagesize (int): Size in bytes of one cache page. Must be
            positive.

        local_cachefile (str), local_indexfile (str): Paths of existing
            cache and index files to attach to. Either both or none of
            them must be given; when omitted, new files are created in
            ``cachedir`` and are not deleted on close.

        multithread_safe (bool): Passed on to the base class.
    '''

    def __init__(self, fileobj, size, cachedir=None, close_on_close=False,
                 cache_size_limit=None, pagesize=16*1024*1024,
                 local_cachefile=None, local_indexfile=None,
                 multithread_safe=False):
        super().__init__(fileobj, size, cachedir, close_on_close,
                         cache_size_limit=cache_size_limit,
                         multithread_safe=multithread_safe)
        assert pagesize > 0
        self.pagesize = pagesize
        self.size = size

        # The base class created a private temporary cache file that is
        # replaced below; close (and thereby delete) it right away
        # instead of leaving the descriptor to the garbage collector.
        self.cachefp.close()

        # Both none or both string file
        assert bool(local_indexfile) == bool(local_cachefile)

        if local_indexfile is None:
            # delete=False: the files have to outlive this object so
            # that other processes can attach to them by name.
            self.indexfp = tempfile.NamedTemporaryFile(delete=False,
                                                       dir=self.cachedir)
            self.cachefp = tempfile.NamedTemporaryFile(delete=False,
                                                       dir=self.cachedir)
            self.local_indexfile = self.indexfp.name
            self.local_cachefile = self.cachefp.name
            self._open_fd(self.indexfp.name, self.cachefp.name)
            self._init_indexfile()

        else:
            self.indexfp = open(local_indexfile, 'rb')
            self.cachefp = open(local_cachefile, 'rb')

            self._open_fd(local_indexfile, local_cachefile)

        self.pid = os.getpid()

    def close(self):
        '''Close all descriptors and, if requested, the wrapped file.

        Calling it more than once is harmless.
        '''
        if self._closed:
            return

        os.close(self.cachefd)
        os.close(self.indexfd)
        self.indexfp.close()
        self.cachefp.close()
        self._closed = True
        # Honor close_on_close the same way the base class does.
        if self.close_on_close:
            self.fileobj.close()

    def _open_fd(self, indexfile, cachefile):
        '''Open read-write descriptors on the index and cache files.'''
        self.local_indexfile = indexfile
        self.local_cachefile = cachefile
        self.indexfd = os.open(self.local_indexfile, os.O_RDWR)
        self.cachefd = os.open(self.local_cachefile, os.O_RDWR)

    def _init_indexfile(self):
        '''Write the index file anew with every page marked uncached.'''
        pagecount = self.size // self.pagesize

        for i in range(pagecount):
            r = _Range(i * self.pagesize, self.pagesize, cached=False)
            self._set_index(i, r)

        # The last page is shorter when size is not a pagesize multiple.
        remain = self.size % self.pagesize
        if remain > 0:
            offset = pagecount * self.pagesize
            r = _Range(offset, remain, cached=False)
            self._set_index(pagecount, r)

    def _get_index(self, i):
        '''Read the ``i``-th page entry from the index file.'''
        assert i >= 0
        width = _Range.size()
        buf = os.pread(self.indexfd, width, width * i)
        return _Range.unpack(buf)

    def _set_index(self, i, r):
        '''Write ``r`` as the ``i``-th page entry of the index file.'''
        assert i >= 0
        assert r is not None
        width = _Range.size()
        written = os.pwrite(self.indexfd, r.pack(), width * i)
        assert width == written

    def read(self, size=-1) -> bytes:
        '''Read up to ``size`` bytes from the current position.

        A negative (or ``None``) ``size`` reads up to the end of the
        file; a read at or past the end returns ``b''``.  Raises
        ``RuntimeError`` if the wrapper is closed.
        '''
        if self._closed:
            raise RuntimeError("closed")

        # Clamp to the remaining bytes.  After a seek past EOF the
        # remaining amount would be negative, which used to end in a
        # lookup of an index entry that does not exist.
        remaining = max(self.size - self.pos, 0)
        if size is None or size < 0 or remaining < size:
            size = remaining
        if size == 0:
            return b''

        # Pages [start, end) cover the requested byte range.
        start = self.pos // self.pagesize
        end = (self.pos + size) // self.pagesize
        if (self.pos + size) % self.pagesize != 0:
            end += 1

        for i in range(start, end):
            with _shflock(self.indexfd):
                r = self._get_index(i)

            if not r.cached:
                # A frozen (preserved) cache must not be written to.
                assert not self._frozen

                with _exflock(self.indexfd):
                    # Check again under the exclusive lock: the page may
                    # have been stored since the shared lock was dropped.
                    r = self._get_index(i)
                    if r.cached:
                        continue

                    self.fileobj.seek(r.start, io.SEEK_SET)
                    data = self.fileobj.read(r.length)
                    n = os.pwrite(self.cachefd, data, r.start)
                    if n < 0:
                        raise RuntimeError("bad file descriptor")
                    self._set_index(i, _Range(r.start, r.length, cached=True))

        # NOTE(review): this read happens without holding the file lock;
        # presumably a concurrent flush (below, in another process) could
        # truncate the cache in between - confirm.
        buf = os.pread(self.cachefd, size, self.pos)

        self.pos += len(buf)
        # NOTE(review): this rewinds the position to 0 once the end of
        # the file is reached, so tell() never reports ``size``; confirm
        # whether this is intended.
        self.pos %= self.size
        if self.pos != self.fileobj.tell():
            self.fileobj.seek(self.pos, io.SEEK_SET)

        with _shflock(self.indexfd):
            is_full = self._is_full()

        # If the cache file is more than the limit, just flush them all.
        if is_full:
            with _exflock(self.indexfd):
                # Check again under the exclusive lock before flushing.
                is_full = self._is_full()
                if is_full:
                    os.truncate(self.cachefd, 0)
                    self._init_indexfile()

        return buf

    def _is_full(self):
        '''Return ``True`` if the cache file's disk usage hit the limit.'''
        if self.cache_size_limit is None:
            return False
        stat = os.stat(self.local_cachefile)
        # st_blocks counts 512-byte units actually allocated, so holes
        # of the sparse cache file are not counted.
        return stat.st_blocks * 512 >= self.cache_size_limit