Source code for MDAnalysis.lib.picklable_file_io

# -*- Mode: python; tab-width: 4; indent-tabs-mode:nil; coding:utf-8 -*-
# vim: tabstop=4 expandtab shiftwidth=4 softtabstop=4
#
# MDAnalysis --- https://www.mdanalysis.org
# Copyright (c) 2006-2017 The MDAnalysis Development Team and contributors
# (see the file AUTHORS for the full list of names)
#
# Released under the GNU Public Licence, v2 or any higher version
#
# Please cite your use of MDAnalysis in published work:
#
# R. J. Gowers, M. Linke, J. Barnoud, T. J. E. Reddy, M. N. Melo, S. L. Seyler,
# D. L. Dotson, J. Domanski, S. Buchoux, I. M. Kenney, and O. Beckstein.
# MDAnalysis: A Python package for the rapid analysis of molecular dynamics
# simulations. In S. Benthall and S. Rostrup editors, Proceedings of the 15th
# Python in Science Conference, pages 102-109, Austin, TX, 2016. SciPy.
# doi: 10.25080/majora-629e541a-00e
#
# N. Michaud-Agrawal, E. J. Denning, T. B. Woolf, and O. Beckstein.
# MDAnalysis: A Toolkit for the Analysis of Molecular Dynamics Simulations.
# J. Comput. Chem. 32 (2011), 2319--2327, doi:10.1002/jcc.21787
#
"""
Picklable read-only I/O classes --- :mod:`MDAnalysis.lib.picklable_file_io`
===========================================================================

Provide with an interface for pickling read-only IO file object.
These classes are used for further pickling :class:`MDAnalysis.core.universe`
in a object composition approach.

.. autoclass:: FileIOPicklable
   :members:

.. autoclass:: BufferIOPicklable
   :members:

.. autoclass:: TextIOPicklable
   :members:

.. autoclass:: BZ2Picklable
   :members:

.. autoclass:: GzipPicklable
   :members:

.. autofunction:: pickle_open

.. autofunction:: bz2_pickle_open

.. autofunction:: gzip_pickle_open


.. versionadded:: 2.0.0
"""
import io
import os

import bz2
import gzip


[docs]class FileIOPicklable(io.FileIO): """File object (read-only) that can be pickled. This class provides a file-like object (as returned by :func:`open`, namely :class:`io.FileIO`) that, unlike standard Python file objects, can be pickled. Only read mode is supported. When the file is pickled, filename and position of the open file handle in the file are saved. On unpickling, the file is opened by filename, and the file is seeked to the saved position. This means that for a successful unpickle, the original file still has to be accessible with its filename. Note ---- This class only supports reading files in binary mode. If you need to open a file in text mode, use the :func:`pickle_open`. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode : str only reading ('r') mode works. It exists to be consistent with a wider API. Example ------- :: >>> file = FileIOPicklable(PDB) >>> file.readline() >>> file_pickled = pickle.loads(pickle.dumps(file)) >>> print(file.tell(), file_pickled.tell()) 55 55 See Also --------- TextIOPicklable BufferIOPicklable .. versionadded:: 2.0.0 """ def __init__(self, name, mode='r'): self._mode = mode super().__init__(name, mode) def __getstate__(self): if self._mode != 'r': raise RuntimeError("Can only pickle files that were opened " "in read mode, not {}".format(self._mode)) return self.name, self.tell() def __setstate__(self, args): name = args[0] super().__init__(name, mode='r') self.seek(args[1])
[docs]class BufferIOPicklable(io.BufferedReader): """A picklable buffer object for read-only FileIO object. This class provides a buffered :class:`io.BufferedReader` that can be pickled. Note that this only works in read mode. Parameters ---------- raw : FileIO object Example ------- :: file = FileIOPicklable('filename') buffer_wrapped = BufferIOPicklable(file) See Also --------- FileIOPicklable TextIOPicklable .. versionadded:: 2.0.0 """ def __init__(self, raw): super().__init__(raw) self.raw_class = raw.__class__ def __getstate__(self): return self.raw_class, self.name, self.tell() def __setstate__(self, args): raw_class = args[0] name = args[1] raw = raw_class(name) super().__init__(raw) self.seek(args[2])
[docs]class TextIOPicklable(io.TextIOWrapper): """Character and line based picklable file-like object. This class provides a file-like :class:`io.TextIOWrapper` object that can be pickled. Note that this only works in read mode. Note ---- After pickling, the current position is reset. `universe.trajectory[i]` has to be used to return to its original frame. Parameters ---------- raw : FileIO object Example ------- :: file = FileIOPicklable('filename') text_wrapped = TextIOPicklable(file) See Also --------- FileIOPicklable BufferIOPicklable .. versionadded:: 2.0.0 """ def __init__(self, raw): super().__init__(raw) self.raw_class = raw.__class__ def __getstate__(self): try: name = self.name except AttributeError: # This is kind of ugly--BZ2File does not save its name. name = self.buffer._fp.name return self.raw_class, name def __setstate__(self, args): raw_class = args[0] name = args[1] # raw_class is used for further expansion this functionality to # Gzip files, which also requires a text wrapper. raw = raw_class(name) super().__init__(raw)
[docs]class BZ2Picklable(bz2.BZ2File): """File object (read-only) for bzip2 (de)compression that can be pickled. This class provides a file-like object (as returned by :func:`bz2.open`, namely :class:`bz2.BZ2File`) that, unlike standard Python file objects, can be pickled. Only read mode is supported. When the file is pickled, filename and position of the open file handle in the file are saved. On unpickling, the file is opened by filename, and the file is seeked to the saved position. This means that for a successful unpickle, the original file still has to be accessible with its filename. Note ---- This class only supports reading files in binary mode. If you need to open to open a compressed file in text mode, use :func:`bz2_pickle_open`. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode : str can only be 'r', 'rb' to make pickle work. Example ------- :: >>> file = BZ2Picklable(XYZ_bz2) >>> file.readline() >>> file_pickled = pickle.loads(pickle.dumps(file)) >>> print(file.tell(), file_pickled.tell()) 5 5 See Also --------- FileIOPicklable BufferIOPicklable TextIOPicklable GzipPicklable .. versionadded:: 2.0.0 """ def __init__(self, name, mode='rb'): self._bz_mode = mode super().__init__(name, mode) def __getstate__(self): if not self._bz_mode.startswith('r'): raise RuntimeError("Can only pickle files that were opened " "in read mode, not {}".format(self._bz_mode)) return self._fp.name, self.tell() def __setstate__(self, args): super().__init__(args[0]) self.seek(args[1])
[docs]class GzipPicklable(gzip.GzipFile): """Gzip file object (read-only) that can be pickled. This class provides a file-like object (as returned by :func:`gzip.open`, namely :class:`gzip.GzipFile`) that, unlike standard Python file objects, can be pickled. Only read mode is supported. When the file is pickled, filename and position of the open file handle in the file are saved. On unpickling, the file is opened by filename, and the file is seeked to the saved position. This means that for a successful unpickle, the original file still has to be accessible with its filename. Note ---- This class only supports reading files in binary mode. If you need to open to open a compressed file in text mode, use the :func:`gzip_pickle_open`. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode : str can only be 'r', 'rb' to make pickle work. Example ------- :: >>> file = GzipPicklable(MMTF_gz) >>> file.readline() >>> file_pickled = pickle.loads(pickle.dumps(file)) >>> print(file.tell(), file_pickled.tell()) 1218 1218 See Also --------- FileIOPicklable BufferIOPicklable TextIOPicklable BZ2Picklable .. versionadded:: 2.0.0 """ def __init__(self, name, mode='rb'): self._gz_mode = mode super().__init__(name, mode) def __getstate__(self): if not self._gz_mode.startswith('r'): raise RuntimeError("Can only pickle files that were opened " "in read mode, not {}".format(self._gz_mode)) return self.name, self.tell() def __setstate__(self, args): super().__init__(args[0]) self.seek(args[1])
[docs]def pickle_open(name, mode='rt'): """Open file and return a stream with pickle function implemented. This function returns a FileIOPicklable object wrapped in a BufferIOPicklable class when given the "rb" reading mode, or a FileIOPicklable object wrapped in a TextIOPicklable class with the "r" or "rt" reading mode. It can be used as a context manager, and replace the built-in :func:`open` function in read mode that only returns an unpicklable file object. In order to serialize a :class:`MDAnalysis.core.Universe`, this function can used to open trajectory/topology files. This object composition is more flexible and easier than class inheritance to implement pickling for new readers. Note ---- Can be only used with read mode. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode: {'r', 'rt', 'rb'} (optional) 'r': open for reading in text mode; 'rt': read in text mode (default); 'rb': read in binary mode; Returns ------- stream-like object: BufferIOPicklable or TextIOPicklable when mode is 'r' or 'rt', returns TextIOPicklable; when mode is 'rb', returns BufferIOPicklable Raises ------ ValueError if `mode` is not one of the allowed read modes Examples ------- open as context manager:: with pickle_open('filename') as f: line = f.readline() open as function:: f = pickle_open('filename') line = f.readline() f.close() See Also -------- :func:`MDAnalysis.lib.util.anyopen` :func:`io.open` .. versionadded:: 2.0.0 """ if mode not in {'r', 'rt', 'rb'}: raise ValueError("Only read mode ('r', 'rt', 'rb') " "files can be pickled.") name = os.fspath(name) raw = FileIOPicklable(name) if mode == 'rb': return BufferIOPicklable(raw) elif mode in {'r', 'rt'}: return TextIOPicklable(raw)
[docs]def bz2_pickle_open(name, mode='rb'): """Open a bzip2-compressed file in binary or text mode with pickle function implemented. This function returns a BZ2Picklable object when given the "rb" or "r" reading mode, or a BZ2Picklable object wrapped in a TextIOPicklable class with the "rt" reading mode. It can be used as a context manager, and replace the built-in :func:`bz2.open` function in read mode that only returns an unpicklable file object. Note ---- Can be only used with read mode. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode: {'r', 'rt', 'rb'} (optional) 'r': open for reading in binary mode; 'rt': read in text mode; 'rb': read in binary mode; (default) Returns ------- stream-like object: BZ2Picklable or TextIOPicklable when mode is 'rt', returns TextIOPicklable; when mode is 'r' or 'rb', returns BZ2Picklable Raises ------ ValueError if `mode` is not one of the allowed read modes Examples ------- open as context manager:: with bz2_pickle_open('filename') as f: line = f.readline() open as function:: f = bz2_pickle_open('filename') line = f.readline() f.close() See Also -------- :func:`io.open` :func:`bz2.open` :func:`MDAnalysis.lib.util.anyopen` :func:`MDAnalysis.lib.picklable_file_io.pickle_open` :func:`MDAnalysis.lib.picklable_file_io.gzip_pickle_open` .. versionadded:: 2.0.0 """ if mode not in {'r', 'rt', 'rb'}: raise ValueError("Only read mode ('r', 'rt', 'rb') " "files can be pickled.") bz_mode = mode.replace("t", "") binary_file = BZ2Picklable(name, bz_mode) if "t" in mode: return TextIOPicklable(binary_file) else: return binary_file
[docs]def gzip_pickle_open(name, mode='rb'): """Open a gzip-compressed file in binary or text mode with pickle function implemented. This function returns a GzipPicklable object when given the "rb" or "r" reading mode, or a GzipPicklable object wrapped in a TextIOPicklable class with the "rt" reading mode. It can be used as a context manager, and replace the built-in :func:`gzip.open` function in read mode that only returns an unpicklable file object. Note ---- Can be only used with read mode. Parameters ---------- name : str either a text or byte string giving the name (and the path if the file isn't in the current working directory) of the file to be opened. mode: {'r', 'rt', 'rb'} (optional) 'r': open for reading in binary mode; 'rt': read in text mode; 'rb': read in binary mode; (default) Returns ------- stream-like object: GzipPicklable or TextIOPicklable when mode is 'rt', returns TextIOPicklable; when mode is 'r' or 'rb', returns GzipPicklable Raises ------ ValueError if `mode` is not one of the allowed read modes Examples ------- open as context manager:: with gzip_pickle_open('filename') as f: line = f.readline() open as function:: f = gzip_pickle_open('filename') line = f.readline() f.close() See Also -------- :func:`io.open` :func:`gzip.open` :func:`MDAnalysis.lib.util.anyopen` :func:`MDAnalysis.lib.picklable_file_io.pickle_open` :func:`MDAnalysis.lib.picklable_file_io.bz2_pickle_open` .. versionadded:: 2.0.0 """ if mode not in {'r', 'rt', 'rb'}: raise ValueError("Only read mode ('r', 'rt', 'rb') " "files can be pickled.") gz_mode = mode.replace("t", "") binary_file = GzipPicklable(name, gz_mode) if "t" in mode: return TextIOPicklable(binary_file) else: return binary_file