Context Navigation

← Previous Change
Next Change →

gzip.py

Timestamp:

Mar 19, 2014, 11:11:30 AM (11 years ago)

Author:

dmik

Message:

python: Update vendor to 2.7.6.

File:

1 edited

python/vendor/current/Lib/gzip.py (modified) (24 diffs)

Legend:

Unmodified
Added
Removed

python/vendor/current/Lib/gzip.py

-              r2
+              r388
 # based on Andrew Kuchling's minigzip.py distributed with the zlib module
 import struct, sys, time
+import struct, sys, time, os
 import zlib
+import io
 import __builtin__
 …
     return GzipFile(filename, mode, compresslevel)
 class GzipFile:
+class GzipFile(io.BufferedIOBase):
     """The GzipFile class simulates most of the methods of a file object with
     the exception of the readinto() and truncate() methods.
 …
     def __init__(self, filename=None, mode=None,
                  compresslevel=9, fileobj=None):
+                 compresslevel=9, fileobj=None, mtime=None):
         """Constructor for the GzipFile class.
 …
         for cross-platform portability.
         The compresslevel argument is an integer from 1 to 9 controlling the
+        The compresslevel argument is an integer from 0 to 9 controlling the
         level of compression; 1 is fastest and produces the least compression,
+        and 9 is slowest and produces the most compression.  The default is 9.
+        and 9 is slowest and produces the most compression. 0 is no compression
+        at all. The default is 9.
+        The mtime argument is an optional numeric timestamp to be written
+        to the stream when compressing.  All gzip compressed streams
+        are required to contain a timestamp.  If omitted or None, the
+        current time is used.  This module ignores the timestamp when
+        decompressing; however, some programs, such as gunzip, make use
+        of it.  The format of the timestamp is the same as that of the
+        return value of time.time() and of the st_mtime member of the
+        object returned by os.stat().
         """
+        # Make sure we don't inadvertently enable universal newlines on the
+        # underlying file object - in read mode, this causes data corruption.
+        if mode:
+            mode = mode.replace('U', '')
         # guarantee the file is opened in binary mode on platforms
         # that care about that sort of thing
 …
             fileobj = self.myfileobj = __builtin__.open(filename, mode or 'rb')
         if filename is None:
+            if hasattr(fileobj, 'name'): filename = fileobj.name
+            else: filename = ''
+            # Issue #13781: os.fdopen() creates a fileobj with a bogus name
+            # attribute. Avoid saving this in the gzip header's filename field.
+            if hasattr(fileobj, 'name') and fileobj.name != '<fdopen>':
+                filename = fileobj.name
+            else:
+                filename = ''
         if mode is None:
             if hasattr(fileobj, 'mode'): mode = fileobj.mode
 …
             # Set flag indicating start of a new member
             self._new_member = True
+            # Buffer data read from gzip file. extrastart is offset in
+            # stream where buffer starts. extrasize is number of
+            # bytes remaining in buffer from current stream position.
             self.extrabuf = ""
             self.extrasize = 0
+            self.extrastart = 0
             self.name = filename
             # Starts small, scales exponentially
 …
         self.fileobj = fileobj
         self.offset = 0
+        self.mtime = mtime
         if self.mode == WRITE:
 …
         return '<gzip ' + s[1:-1] + ' ' + hex(id(self)) + '>'
+    def _check_closed(self):
+        """Raises a ValueError if the underlying file object has been closed.
+        """
+        if self.closed:
+            raise ValueError('I/O operation on closed file.')
     def _init_write(self, filename):
         self.name = filename
 …
         self.fileobj.write('\037\213')             # magic header
         self.fileobj.write('\010')                 # compression method
         fname = self.name
+        fname = os.path.basename(self.name)
         if fname.endswith(".gz"):
             fname = fname[:-3]
 …
             flags = FNAME
         self.fileobj.write(chr(flags))
+        write32u(self.fileobj, long(time.time()))
+        mtime = self.mtime
+        if mtime is None:
+            mtime = time.time()
+        write32u(self.fileobj, long(mtime))
         self.fileobj.write('\002')
         self.fileobj.write('\377')
 …
             raise IOError, 'Unknown compression method'
         flag = ord( self.fileobj.read(1) )
         # modtime = self.fileobj.read(4)
+        self.mtime = read32(self.fileobj)
         # extraflag = self.fileobj.read(1)
         # os = self.fileobj.read(1)
         self.fileobj.read(6)
+        self.fileobj.read(2)
         if flag & FEXTRA:
 …
             self.fileobj.read(2)     # Read & discard the 16-bit header CRC
     def write(self,data):
+        self._check_closed()
         if self.mode != WRITE:
             import errno
 …
         if self.fileobj is None:
             raise ValueError, "write() on closed GzipFile object"
+        # Convert data type if called by io.BufferedWriter.
+        if isinstance(data, memoryview):
+            data = data.tobytes()
         if len(data) > 0:
             self.size = self.size + len(data)
 …
             self.offset += len(data)
+        return len(data)
     def read(self, size=-1):
+        self._check_closed()
         if self.mode != READ:
             import errno
 …
                     size = self.extrasize
         chunk = self.extrabuf[:size]
         self.extrabuf = self.extrabuf[size:]
+        offset = self.offset - self.extrastart
+        chunk = self.extrabuf[offset: offset + size]
         self.extrasize = self.extrasize - size
 …
     def _unread(self, buf):
-        self.extrabuf = buf + self.extrabuf
         self.extrasize = len(buf) + self.extrasize
         self.offset -= len(buf)
 …
     def _add_read_data(self, data):
         self.crc = zlib.crc32(data, self.crc) & 0xffffffffL
+        self.extrabuf = self.extrabuf + data
+        offset = self.offset - self.extrastart
+        self.extrabuf = self.extrabuf[offset:] + data
         self.extrasize = self.extrasize + len(data)
+        self.extrastart = self.offset
         self.size = self.size + len(data)
 …
             raise IOError, "Incorrect length of data produced"
+        # Gzip files can be padded with zeroes and still have archives.
+        # Consume all zero bytes and set the file position to the first
+        # non-zero byte. See http://www.gzip.org/#faq8
+        c = "\x00"
+        while c == "\x00":
+            c = self.fileobj.read(1)
+        if c:
+            self.fileobj.seek(-1, 1)
+    @property
+    def closed(self):
+        return self.fileobj is None
     def close(self):
         if self.fileobj is None:
 …
             self.myfileobj = None
-    def __del__(self):
-        try:
-            if (self.myfileobj is None and
-                self.fileobj is None):
-                return
-        except AttributeError:
-            return
-        self.close()
     def flush(self,zlib_mode=zlib.Z_SYNC_FLUSH):
+        self._check_closed()
         if self.mode == WRITE:
             # Ensure the compressor's buffer is flushed
             self.fileobj.write(self.compress.flush(zlib_mode))
         self.fileobj.flush()
+            self.fileobj.flush()
     def fileno(self):
 …
         """
         return self.fileobj.fileno()
-    def isatty(self):
-        return False
-    def tell(self):
-        return self.offset
     def rewind(self):
 …
         self.extrabuf = ""
         self.extrasize = 0
+        self.extrastart = 0
         self.offset = 0
+    def readable(self):
+        return self.mode == READ
+    def writable(self):
+        return self.mode == WRITE
+    def seekable(self):
+        return True
     def seek(self, offset, whence=0):
 …
                 raise IOError('Negative seek in write mode')
             count = offset - self.offset
             for i in range(count // 1024):
+            for i in xrange(count // 1024):
                 self.write(1024 * '\0')
             self.write((count % 1024) * '\0')
 …
                 self.rewind()
             count = offset - self.offset
             for i in range(count // 1024):
+            for i in xrange(count // 1024):
                 self.read(1024)
             self.read(count % 1024)
+        return self.offset
     def readline(self, size=-1):
         if size < 0:
+            # Shortcut common case - newline found in buffer.
+            offset = self.offset - self.extrastart
+            i = self.extrabuf.find('\n', offset) + 1
+            if i > 0:
+                self.extrasize -= i - offset
+                self.offset += i - offset
+                return self.extrabuf[offset: i]
             size = sys.maxint
             readsize = self.min_readsize
 …
             self.min_readsize = min(readsize, self.min_readsize * 2, 512)
         return ''.join(bufs) # Return resulting line
-    def readlines(self, sizehint=0):
-        # Negative numbers result in reading all the lines
-        if sizehint <= 0:
-            sizehint = sys.maxint
-        L = []
-        while sizehint > 0:
-            line = self.readline()
-            if line == "":
-                break
-            L.append(line)
-            sizehint = sizehint - len(line)
-        return L
-    def writelines(self, L):
-        for line in L:
-            self.write(line)
-    def __iter__(self):
-        return self
-    def next(self):
-        line = self.readline()
-        if line:
-            return line
-        else:
-            raise StopIteration

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 388 for python/vendor/current/Lib/gzip.py

Legend:

python/vendor/current/Lib/gzip.py

Download in other formats: