"""Functions that read and write gzipped files.

The user of the file doesn't have to worry about the compression,
but random access is not allowed."""

[3] Fix | Delete

[4] Fix | Delete

# based on Andrew Kuchling's minigzip.py distributed with the zlib module

[5] Fix | Delete

[6] Fix | Delete

import struct, sys, time, os

[7] Fix | Delete

import zlib

[8] Fix | Delete

import builtins

[9] Fix | Delete

import io

[10] Fix | Delete

import _compression

[11] Fix | Delete

[12] Fix | Delete

__all__ = ["BadGzipFile", "GzipFile", "open", "compress", "decompress"]

[13] Fix | Delete

[14] Fix | Delete

# Bit masks tested against the flag byte of a gzip member header.
FTEXT, FHCRC, FEXTRA, FNAME, FCOMMENT = 1, 2, 4, 8, 16

# Values stored in GzipFile.mode to record the direction of the stream.
READ, WRITE = 1, 2

# Named compression levels; the header writer maps FAST and BEST to
# dedicated XFL byte values.
_COMPRESS_LEVEL_FAST = 1
_COMPRESS_LEVEL_TRADEOFF = 6
_COMPRESS_LEVEL_BEST = 9

[21] Fix | Delete

[22] Fix | Delete

[23] Fix | Delete

def open(filename, mode="rb", compresslevel=_COMPRESS_LEVEL_BEST,
         encoding=None, errors=None, newline=None):
    """Open a gzip-compressed file in binary or text mode.

    The filename argument can be an actual filename (a str, bytes or
    os.PathLike object), or an existing file object to read from or write to.

    The mode argument can be "r", "rb", "w", "wb", "x", "xb", "a" or "ab" for
    binary mode, or "rt", "wt", "xt" or "at" for text mode. The default mode is
    "rb", and the default compresslevel is 9.

    For binary mode, this function is equivalent to the GzipFile constructor:
    GzipFile(filename, mode, compresslevel). In this case, the encoding, errors
    and newline arguments must not be provided.

    For text mode, a GzipFile object is created, and wrapped in an
    io.TextIOWrapper instance with the specified encoding, error handling
    behavior, and line ending(s).

    Raises ValueError for a mode containing both "t" and "b", or when a
    text-only argument is given in binary mode, and TypeError when filename
    is neither a path nor an object with a read or write attribute.

    """
    if "t" in mode:
        if "b" in mode:
            raise ValueError("Invalid mode: %r" % (mode,))
    else:
        if encoding is not None:
            raise ValueError("Argument 'encoding' not supported in binary mode")
        if errors is not None:
            raise ValueError("Argument 'errors' not supported in binary mode")
        if newline is not None:
            raise ValueError("Argument 'newline' not supported in binary mode")

    # GzipFile itself only understands binary modes.
    gz_mode = mode.replace("t", "")
    if isinstance(filename, (str, bytes, os.PathLike)):
        binary_file = GzipFile(filename, gz_mode, compresslevel)
    elif hasattr(filename, "read") or hasattr(filename, "write"):
        binary_file = GzipFile(None, gz_mode, compresslevel, filename)
    else:
        raise TypeError("filename must be a str or bytes object, or a file")

    if "t" in mode:
        try:
            return io.TextIOWrapper(binary_file, encoding, errors, newline)
        except BaseException:
            # The wrapper could not be built (e.g. unknown encoding); do not
            # leave the GzipFile we just created open behind the caller's back.
            binary_file.close()
            raise
    else:
        return binary_file

[66] Fix | Delete

[67] Fix | Delete

def write32u(output, value):
    """Write *value* to *output* as a 4-byte little-endian unsigned integer.

    *output* is any object with a write() method accepting bytes.  *value*
    must fit in an unsigned 32-bit field; struct.pack() rejects anything
    else, so callers mask larger quantities before calling.
    """
    output.write(struct.pack("<L", value))

[71] Fix | Delete

[72] Fix | Delete

class _PaddedFile:

[73] Fix | Delete

"""Minimal read-only file object that prepends a string to the contents

[74] Fix | Delete

of an actual file. Shouldn't be used outside of gzip.py, as it lacks

[75] Fix | Delete

essential functionality."""

[76] Fix | Delete

[77] Fix | Delete

def __init__(self, f, prepend=b''):

[78] Fix | Delete

self._buffer = prepend

[79] Fix | Delete

self._length = len(prepend)

[80] Fix | Delete

self.file = f

[81] Fix | Delete

self._read = 0

[82] Fix | Delete

[83] Fix | Delete

def read(self, size):

[84] Fix | Delete

if self._read is None:

[85] Fix | Delete

return self.file.read(size)

[86] Fix | Delete

if self._read + size <= self._length:

[87] Fix | Delete

read = self._read

[88] Fix | Delete

self._read += size

[89] Fix | Delete

return self._buffer[read:self._read]

[90] Fix | Delete

else:

[91] Fix | Delete

read = self._read

[92] Fix | Delete

self._read = None

[93] Fix | Delete

return self._buffer[read:] + \

[94] Fix | Delete

self.file.read(size-self._length+read)

[95] Fix | Delete

[96] Fix | Delete

def prepend(self, prepend=b''):

[97] Fix | Delete

if self._read is None:

[98] Fix | Delete

self._buffer = prepend

[99] Fix | Delete

else: # Assume data was read since the last prepend() call

[100] Fix | Delete

self._read -= len(prepend)

[101] Fix | Delete

return

[102] Fix | Delete

self._length = len(self._buffer)

[103] Fix | Delete

self._read = 0

[104] Fix | Delete

[105] Fix | Delete

def seek(self, off):

[106] Fix | Delete

self._read = None

[107] Fix | Delete

self._buffer = None

[108] Fix | Delete

return self.file.seek(off)

[109] Fix | Delete

[110] Fix | Delete

def seekable(self):

[111] Fix | Delete

return True # Allows fast-forwarding even in unseekable streams

[112] Fix | Delete

[113] Fix | Delete

[114] Fix | Delete

class BadGzipFile(OSError):
    """Exception raised in some cases for invalid gzip files."""

[116] Fix | Delete

[117] Fix | Delete

[118] Fix | Delete

class GzipFile(_compression.BaseStream):
    """The GzipFile class simulates most of the methods of a file object with
    the exception of the truncate() method.

    This class only supports opening files in binary mode. If you need to open a
    compressed file in text mode, use the gzip.open() function.

    """

    # Overridden with internal file object to be closed, if only a filename
    # is passed in
    myfileobj = None

    def __init__(self, filename=None, mode=None,
                 compresslevel=_COMPRESS_LEVEL_BEST, fileobj=None, mtime=None):
        """Constructor for the GzipFile class.

        At least one of fileobj and filename must be given a
        non-trivial value.

        The new class instance is based on fileobj, which can be a regular
        file, an io.BytesIO object, or any other object which simulates a file.
        It defaults to None, in which case filename is opened to provide
        a file object.

        When fileobj is not None, the filename argument is only used to be
        included in the gzip file header, which may include the original
        filename of the uncompressed file.  It defaults to the filename of
        fileobj, if discernible; otherwise, it defaults to the empty string,
        and in this case the original filename is not included in the header.

        The mode argument can be any of 'r', 'rb', 'a', 'ab', 'w', 'wb', 'x', or
        'xb' depending on whether the file will be read or written.  The default
        is the mode of fileobj if discernible; otherwise, the default is 'rb'.
        A mode of 'r' is equivalent to one of 'rb', and similarly for 'w' and
        'wb', 'a' and 'ab', and 'x' and 'xb'.

        The compresslevel argument is an integer from 0 to 9 controlling the
        level of compression; 1 is fastest and produces the least compression,
        and 9 is slowest and produces the most compression. 0 is no compression
        at all. The default is 9.

        The mtime argument is an optional numeric timestamp to be written
        to the last modification time field in the stream when compressing.
        If omitted or None, the current time is used.

        """

        if mode and ('t' in mode or 'U' in mode):
            raise ValueError("Invalid mode: {!r}".format(mode))
        if mode and 'b' not in mode:
            mode += 'b'
        if fileobj is None:
            # We own this file object, so close() must close it too.
            fileobj = self.myfileobj = builtins.open(filename, mode or 'rb')
        if filename is None:
            filename = getattr(fileobj, 'name', '')
            if not isinstance(filename, (str, bytes)):
                filename = ''
        else:
            filename = os.fspath(filename)
        # Remember whether the caller chose the mode explicitly; an implicit
        # write mode triggers the FutureWarning below.
        origmode = mode
        if mode is None:
            mode = getattr(fileobj, 'mode', 'rb')

        if mode.startswith('r'):
            self.mode = READ
            raw = _GzipReader(fileobj)
            self._buffer = io.BufferedReader(raw)
            self.name = filename

        elif mode.startswith(('w', 'a', 'x')):
            if origmode is None:
                import warnings
                warnings.warn(
                    "GzipFile was opened for writing, but this will "
                    "change in future Python releases.  "
                    "Specify the mode argument for opening it for writing.",
                    FutureWarning, 2)
            self.mode = WRITE
            self._init_write(filename)
            # Negative wbits selects a raw deflate stream; the gzip header
            # and trailer are written by this class itself.
            self.compress = zlib.compressobj(compresslevel,
                                             zlib.DEFLATED,
                                             -zlib.MAX_WBITS,
                                             zlib.DEF_MEM_LEVEL,
                                             0)
            self._write_mtime = mtime
        else:
            raise ValueError("Invalid mode: {!r}".format(mode))

        self.fileobj = fileobj

        if self.mode == WRITE:
            self._write_gzip_header(compresslevel)

    @property
    def filename(self):
        """Deprecated alias of the name attribute.

        In write mode a ".gz" suffix is appended when the name lacks one.
        """
        import warnings
        warnings.warn("use the name attribute", DeprecationWarning, 2)
        # self.name may be str or bytes; use a suffix of the matching type so
        # the comparison is meaningful and the concatenation cannot fail.
        suffix = b".gz" if isinstance(self.name, bytes) else ".gz"
        if self.mode == WRITE and self.name[-3:] != suffix:
            return self.name + suffix
        return self.name

    @property
    def mtime(self):
        """Last modification time read from stream, or None"""
        return self._buffer.raw._last_mtime

    def __repr__(self):
        s = repr(self.fileobj)
        return '<gzip ' + s[1:-1] + ' ' + hex(id(self)) + '>'

    def _init_write(self, filename):
        """Reset the per-stream state used while compressing."""
        self.name = filename
        self.crc = zlib.crc32(b"")
        self.size = 0
        self.writebuf = []
        self.bufsize = 0
        self.offset = 0  # Current file offset for seek(), tell(), etc

    def _write_gzip_header(self, compresslevel):
        """Write the gzip member header to self.fileobj."""
        self.fileobj.write(b'\037\213')             # magic header
        self.fileobj.write(b'\010')                 # compression method
        try:
            # RFC 1952 requires the FNAME field to be Latin-1. Do not
            # include filenames that cannot be represented that way.
            fname = os.path.basename(self.name)
            if not isinstance(fname, bytes):
                fname = fname.encode('latin-1')
            if fname.endswith(b'.gz'):
                fname = fname[:-3]
        except UnicodeEncodeError:
            fname = b''
        flags = 0
        if fname:
            flags = FNAME
        self.fileobj.write(bytes([flags]))
        mtime = self._write_mtime
        if mtime is None:
            mtime = time.time()
        write32u(self.fileobj, int(mtime))
        # XFL byte: the fastest and best levels have dedicated values.
        if compresslevel == _COMPRESS_LEVEL_BEST:
            xfl = b'\002'
        elif compresslevel == _COMPRESS_LEVEL_FAST:
            xfl = b'\004'
        else:
            xfl = b'\000'
        self.fileobj.write(xfl)
        self.fileobj.write(b'\377')
        if fname:
            self.fileobj.write(fname + b'\000')

    def write(self, data):
        """Compress *data* and write it out; return the uncompressed length.

        Raises OSError(EBADF) when the file was not opened for writing.
        """
        self._check_not_closed()
        if self.mode != WRITE:
            import errno
            raise OSError(errno.EBADF, "write() on read-only GzipFile object")

        if self.fileobj is None:
            raise ValueError("write() on closed GzipFile object")

        if isinstance(data, bytes):
            length = len(data)
        else:
            # accept any data that supports the buffer protocol
            data = memoryview(data)
            length = data.nbytes

        if length > 0:
            self.fileobj.write(self.compress.compress(data))
            self.size += length
            self.crc = zlib.crc32(data, self.crc)
            self.offset += length

        return length

    def read(self, size=-1):
        """Read and return up to *size* uncompressed bytes.

        Raises OSError(EBADF) when the file was not opened for reading.
        """
        self._check_not_closed()
        if self.mode != READ:
            import errno
            raise OSError(errno.EBADF, "read() on write-only GzipFile object")
        return self._buffer.read(size)

    def read1(self, size=-1):
        """Implements BufferedIOBase.read1()

        Reads up to a buffer's worth of data if size is negative."""
        self._check_not_closed()
        if self.mode != READ:
            import errno
            raise OSError(errno.EBADF, "read1() on write-only GzipFile object")

        if size < 0:
            size = io.DEFAULT_BUFFER_SIZE
        return self._buffer.read1(size)

    def peek(self, n):
        """Delegate to the internal buffered reader's peek().

        Raises OSError(EBADF) when the file was not opened for reading.
        """
        self._check_not_closed()
        if self.mode != READ:
            import errno
            raise OSError(errno.EBADF, "peek() on write-only GzipFile object")
        return self._buffer.peek(n)

    @property
    def closed(self):
        return self.fileobj is None

    def close(self):
        """Finish the stream and release the file object.

        In write mode the remaining compressed data is flushed, followed by
        the CRC and the size trailer.  Only a file object opened by this
        instance (myfileobj) is closed; a caller-supplied fileobj is left
        open.  Calling close() more than once is a no-op.
        """
        fileobj = self.fileobj
        if fileobj is None:
            return
        self.fileobj = None
        try:
            if self.mode == WRITE:
                fileobj.write(self.compress.flush())
                write32u(fileobj, self.crc)
                # self.size may exceed 2 GiB, or even 4 GiB
                write32u(fileobj, self.size & 0xffffffff)
            elif self.mode == READ:
                self._buffer.close()
        finally:
            myfileobj = self.myfileobj
            if myfileobj:
                self.myfileobj = None
                myfileobj.close()

    def flush(self, zlib_mode=zlib.Z_SYNC_FLUSH):
        """In write mode, flush the compressor and the underlying file."""
        self._check_not_closed()
        if self.mode == WRITE:
            # Ensure the compressor's buffer is flushed
            self.fileobj.write(self.compress.flush(zlib_mode))
            self.fileobj.flush()

    def fileno(self):
        """Invoke the underlying file object's fileno() method.

        This will raise AttributeError if the underlying file object
        doesn't support fileno().
        """
        return self.fileobj.fileno()

    def rewind(self):
        '''Return the uncompressed stream file position indicator to the
        beginning of the file'''
        if self.mode != READ:
            raise OSError("Can't rewind in write mode")
        self._buffer.seek(0)

    def readable(self):
        return self.mode == READ

    def writable(self):
        return self.mode == WRITE

    def seekable(self):
        return True

    def seek(self, offset, whence=io.SEEK_SET):
        """Change the position in the uncompressed stream.

        In write mode only forward seeks are possible; the gap is filled by
        writing zero bytes.  In read mode the request is delegated to the
        internal buffered reader.
        """
        if self.mode == WRITE:
            if whence != io.SEEK_SET:
                if whence == io.SEEK_CUR:
                    offset = self.offset + offset
                else:
                    raise ValueError('Seek from end not supported')
            if offset < self.offset:
                raise OSError('Negative seek in write mode')
            count = offset - self.offset
            chunk = b'\0' * 1024
            for _ in range(count // 1024):
                self.write(chunk)
            self.write(b'\0' * (count % 1024))
        elif self.mode == READ:
            self._check_not_closed()
            return self._buffer.seek(offset, whence)

        return self.offset

    def readline(self, size=-1):
        """Read one line of uncompressed data.

        Raises OSError(EBADF) when the file was not opened for reading.
        """
        self._check_not_closed()
        if self.mode != READ:
            # There is no read buffer in write mode; fail the same way
            # read(), read1() and peek() do.
            import errno
            raise OSError(errno.EBADF,
                          "readline() on write-only GzipFile object")
        return self._buffer.readline(size)

[397] Fix | Delete

[398] Fix | Delete

[399] Fix | Delete

class _GzipReader(_compression.DecompressReader):

[400] Fix | Delete

def __init__(self, fp):
    """Set up raw-deflate decompression over *fp*.

    *fp* is wrapped in a _PaddedFile so that bytes read past the end of a
    member can be pushed back.
    """
    super().__init__(_PaddedFile(fp), zlib.decompressobj,
                     wbits=-zlib.MAX_WBITS)
    # Set flag indicating start of a new member
    self._new_member = True
    self._last_mtime = None

[406] Fix | Delete

[407] Fix | Delete

def _init_read(self):

[408] Fix | Delete

self._crc = zlib.crc32(b"")

[409] Fix | Delete

self._stream_size = 0 # Decompressed size of unconcatenated stream

[410] Fix | Delete

[411] Fix | Delete

def _read_exact(self, n):

[412] Fix | Delete

'''Read exactly *n* bytes from `self._fp`

[413] Fix | Delete

[414] Fix | Delete

This method is required because self._fp may be unbuffered,

[415] Fix | Delete

i.e. return short reads.

[416] Fix | Delete

'''

[417] Fix | Delete

[418] Fix | Delete

data = self._fp.read(n)

[419] Fix | Delete

while len(data) < n:

[420] Fix | Delete

b = self._fp.read(n - len(data))

[421] Fix | Delete

if not b:

[422] Fix | Delete

raise EOFError("Compressed file ended before the "

[423] Fix | Delete

"end-of-stream marker was reached")

[424] Fix | Delete

data += b

[425] Fix | Delete

return data

[426] Fix | Delete

[427] Fix | Delete

def _read_gzip_header(self):
    """Consume one gzip member header from self._fp.

    Returns False when the file is already at EOF (no further member) and
    True once a header has been read.  The header's modification time is
    stored in self._last_mtime.  Raises BadGzipFile for a wrong magic
    number or an unknown compression method.
    """
    magic = self._fp.read(2)
    if magic == b'':
        return False

    if magic != b'\037\213':
        raise BadGzipFile('Not a gzipped file (%r)' % magic)

    # Method byte, flag byte, 32-bit mtime; the two trailing header bytes
    # are skipped by the "xx" pad codes.
    (method, flag,
     self._last_mtime) = struct.unpack("<BBIxx", self._read_exact(8))
    if method != 8:
        raise BadGzipFile('Unknown compression method')

    if flag & FEXTRA:
        # Read & discard the extra field, if present
        extra_len, = struct.unpack("<H", self._read_exact(2))
        self._read_exact(extra_len)
    if flag & FNAME:
        # Read and discard a null-terminated string containing the filename
        while True:
            s = self._fp.read(1)
            if not s or s == b'\000':
                break
    if flag & FCOMMENT:
        # Read and discard a null-terminated string containing a comment
        while True:
            s = self._fp.read(1)
            if not s or s == b'\000':
                break
    if flag & FHCRC:
        self._read_exact(2)     # Read & discard the 16-bit header CRC
    return True

[459] Fix | Delete

[460] Fix | Delete

def read(self, size=-1):

[461] Fix | Delete

if size < 0:

[462] Fix | Delete

return self.readall()

[463] Fix | Delete

# size=0 is special because decompress(max_length=0) is not supported

[464] Fix | Delete

if not size:

[465] Fix | Delete

return b""

[466] Fix | Delete

[467] Fix | Delete

# For certain input data, a single

[468] Fix | Delete

# call to decompress() may not return

[469] Fix | Delete

# any data. In this case, retry until we get some data or reach EOF.

[470] Fix | Delete

while True:

[471] Fix | Delete

if self._decompressor.eof:

[472] Fix | Delete

# Ending case: we've come to the end of a member in the file,

[473] Fix | Delete

# so finish up this member, and read a new gzip header.

[474] Fix | Delete

# Check the CRC and file size, and set the flag so we read

[475] Fix | Delete

# a new member

[476] Fix | Delete

self._read_eof()

[477] Fix | Delete

self._new_member = True

[478] Fix | Delete

self._decompressor = self._decomp_factory(

[479] Fix | Delete

**self._decomp_args)

[480] Fix | Delete

[481] Fix | Delete

if self._new_member:

[482] Fix | Delete

# If the _new_member flag is set, we have to

[483] Fix | Delete

# jump to the next member, if there is one.

[484] Fix | Delete

self._init_read()

[485] Fix | Delete

if not self._read_gzip_header():

[486] Fix | Delete

self._size = self._pos

[487] Fix | Delete

return b""

[488] Fix | Delete

self._new_member = False

[489] Fix | Delete

[490] Fix | Delete

# Read a chunk of data from the file

[491] Fix | Delete

buf = self._fp.read(io.DEFAULT_BUFFER_SIZE)

[492] Fix | Delete

[493] Fix | Delete

uncompress = self._decompressor.decompress(buf, size)

[494] Fix | Delete

if self._decompressor.unconsumed_tail != b"":

[495] Fix | Delete

self._fp.prepend(self._decompressor.unconsumed_tail)

[496] Fix | Delete

elif self._decompressor.unused_data != b"":

[497] Fix | Delete

# Prepend the already read bytes to the fileobj so they can

[498] Fix | Delete

# be seen by _read_eof() and _read_gzip_header()

[499] Fix | Delete