Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cpython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
cpython
Commits
6e165b40
Commit
6e165b40
authored
May 11, 2013
by
Benjamin Peterson
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
backout 214d8909513d for regressions (#1159051)
parent
c8759666
Changes
4
Show whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
36 additions
and
71 deletions
+36
-71
Lib/gzip.py
Lib/gzip.py
+36
-33
Lib/test/test_bz2.py
Lib/test/test_bz2.py
+0
-18
Lib/test/test_gzip.py
Lib/test/test_gzip.py
+0
-17
Misc/NEWS
Misc/NEWS
+0
-3
No files found.
Lib/gzip.py
View file @
6e165b40
...
@@ -21,6 +21,9 @@ def write32u(output, value):
...
@@ -21,6 +21,9 @@ def write32u(output, value):
# or unsigned.
# or unsigned.
output
.
write
(
struct
.
pack
(
"<L"
,
value
))
output
.
write
(
struct
.
pack
(
"<L"
,
value
))
def
read32
(
input
):
return
struct
.
unpack
(
"<I"
,
input
.
read
(
4
))[
0
]
def
open
(
filename
,
mode
=
"rb"
,
compresslevel
=
9
):
def
open
(
filename
,
mode
=
"rb"
,
compresslevel
=
9
):
"""Shorthand for GzipFile(filename, mode, compresslevel).
"""Shorthand for GzipFile(filename, mode, compresslevel).
...
@@ -181,29 +184,24 @@ class GzipFile(io.BufferedIOBase):
...
@@ -181,29 +184,24 @@ class GzipFile(io.BufferedIOBase):
self
.
crc
=
zlib
.
crc32
(
""
)
&
0xffffffff
L
self
.
crc
=
zlib
.
crc32
(
""
)
&
0xffffffff
L
self
.
size
=
0
self
.
size
=
0
def
_read_exact
(
self
,
n
):
data
=
self
.
fileobj
.
read
(
n
)
while
len
(
data
)
<
n
:
b
=
self
.
fileobj
.
read
(
n
-
len
(
data
))
if
not
b
:
raise
EOFError
(
"Compressed file ended before the "
"end-of-stream marker was reached"
)
data
+=
b
return
data
def
_read_gzip_header
(
self
):
def
_read_gzip_header
(
self
):
magic
=
self
.
fileobj
.
read
(
2
)
magic
=
self
.
fileobj
.
read
(
2
)
if
magic
!=
'
\
037
\
213
'
:
if
magic
!=
'
\
037
\
213
'
:
raise
IOError
,
'Not a gzipped file'
raise
IOError
,
'Not a gzipped file'
method
=
ord
(
self
.
fileobj
.
read
(
1
)
)
method
,
flag
,
self
.
mtime
=
struct
.
unpack
(
"<BBIxx"
,
self
.
_read_exact
(
8
))
if
method
!=
8
:
if
method
!=
8
:
raise
IOError
,
'Unknown compression method'
raise
IOError
,
'Unknown compression method'
flag
=
ord
(
self
.
fileobj
.
read
(
1
)
)
self
.
mtime
=
read32
(
self
.
fileobj
)
# extraflag = self.fileobj.read(1)
# os = self.fileobj.read(1)
self
.
fileobj
.
read
(
2
)
if
flag
&
FEXTRA
:
if
flag
&
FEXTRA
:
# Read & discard the extra field, if present
# Read & discard the extra field, if present
extra_len
,
=
struct
.
unpack
(
"<H"
,
self
.
_read_exact
(
2
))
xlen
=
ord
(
self
.
fileobj
.
read
(
1
))
self
.
_read_exact
(
extra_len
)
xlen
=
xlen
+
256
*
ord
(
self
.
fileobj
.
read
(
1
))
self
.
fileobj
.
read
(
xlen
)
if
flag
&
FNAME
:
if
flag
&
FNAME
:
# Read and discard a null-terminated string containing the filename
# Read and discard a null-terminated string containing the filename
while
True
:
while
True
:
...
@@ -217,7 +215,7 @@ class GzipFile(io.BufferedIOBase):
...
@@ -217,7 +215,7 @@ class GzipFile(io.BufferedIOBase):
if
not
s
or
s
==
'
\
000
'
:
if
not
s
or
s
==
'
\
000
'
:
break
break
if
flag
&
FHCRC
:
if
flag
&
FHCRC
:
self
.
_read_exact
(
2
)
# Read & discard the 16-bit header CRC
self
.
fileobj
.
read
(
2
)
# Read & discard the 16-bit header CRC
def
write
(
self
,
data
):
def
write
(
self
,
data
):
self
.
_check_closed
()
self
.
_check_closed
()
...
@@ -251,16 +249,20 @@ class GzipFile(io.BufferedIOBase):
...
@@ -251,16 +249,20 @@ class GzipFile(io.BufferedIOBase):
readsize
=
1024
readsize
=
1024
if
size
<
0
:
# get the whole thing
if
size
<
0
:
# get the whole thing
while
self
.
_read
(
readsize
):
try
:
while
True
:
self
.
_read
(
readsize
)
readsize
=
min
(
self
.
max_read_chunk
,
readsize
*
2
)
readsize
=
min
(
self
.
max_read_chunk
,
readsize
*
2
)
except
EOFError
:
size
=
self
.
extrasize
size
=
self
.
extrasize
else
:
# just get some more of it
else
:
# just get some more of it
try
:
while
size
>
self
.
extrasize
:
while
size
>
self
.
extrasize
:
if
not
self
.
_read
(
readsize
):
self
.
_read
(
readsize
)
readsize
=
min
(
self
.
max_read_chunk
,
readsize
*
2
)
except
EOFError
:
if
size
>
self
.
extrasize
:
if
size
>
self
.
extrasize
:
size
=
self
.
extrasize
size
=
self
.
extrasize
break
readsize
=
min
(
self
.
max_read_chunk
,
readsize
*
2
)
offset
=
self
.
offset
-
self
.
extrastart
offset
=
self
.
offset
-
self
.
extrastart
chunk
=
self
.
extrabuf
[
offset
:
offset
+
size
]
chunk
=
self
.
extrabuf
[
offset
:
offset
+
size
]
...
@@ -275,7 +277,7 @@ class GzipFile(io.BufferedIOBase):
...
@@ -275,7 +277,7 @@ class GzipFile(io.BufferedIOBase):
def
_read
(
self
,
size
=
1024
):
def
_read
(
self
,
size
=
1024
):
if
self
.
fileobj
is
None
:
if
self
.
fileobj
is
None
:
r
eturn
False
r
aise
EOFError
,
"Reached EOF"
if
self
.
_new_member
:
if
self
.
_new_member
:
# If the _new_member flag is set, we have to
# If the _new_member flag is set, we have to
...
@@ -286,7 +288,7 @@ class GzipFile(io.BufferedIOBase):
...
@@ -286,7 +288,7 @@ class GzipFile(io.BufferedIOBase):
pos
=
self
.
fileobj
.
tell
()
# Save current position
pos
=
self
.
fileobj
.
tell
()
# Save current position
self
.
fileobj
.
seek
(
0
,
2
)
# Seek to end of file
self
.
fileobj
.
seek
(
0
,
2
)
# Seek to end of file
if
pos
==
self
.
fileobj
.
tell
():
if
pos
==
self
.
fileobj
.
tell
():
r
eturn
False
r
aise
EOFError
,
"Reached EOF"
else
:
else
:
self
.
fileobj
.
seek
(
pos
)
# Return to original position
self
.
fileobj
.
seek
(
pos
)
# Return to original position
...
@@ -303,10 +305,9 @@ class GzipFile(io.BufferedIOBase):
...
@@ -303,10 +305,9 @@ class GzipFile(io.BufferedIOBase):
if
buf
==
""
:
if
buf
==
""
:
uncompress
=
self
.
decompress
.
flush
()
uncompress
=
self
.
decompress
.
flush
()
self
.
fileobj
.
seek
(
-
len
(
self
.
decompress
.
unused_data
),
1
)
self
.
_read_eof
()
self
.
_read_eof
()
self
.
_add_read_data
(
uncompress
)
self
.
_add_read_data
(
uncompress
)
r
eturn
False
r
aise
EOFError
,
'Reached EOF'
uncompress
=
self
.
decompress
.
decompress
(
buf
)
uncompress
=
self
.
decompress
.
decompress
(
buf
)
self
.
_add_read_data
(
uncompress
)
self
.
_add_read_data
(
uncompress
)
...
@@ -316,14 +317,13 @@ class GzipFile(io.BufferedIOBase):
...
@@ -316,14 +317,13 @@ class GzipFile(io.BufferedIOBase):
# so seek back to the start of the unused data, finish up
# so seek back to the start of the unused data, finish up
# this member, and read a new gzip header.
# this member, and read a new gzip header.
# (The number of bytes to seek back is the length of the unused
# (The number of bytes to seek back is the length of the unused
# data)
# data
, minus 8 because _read_eof() will rewind a further 8 bytes
)
self
.
fileobj
.
seek
(
-
len
(
self
.
decompress
.
unused_data
)
,
1
)
self
.
fileobj
.
seek
(
-
len
(
self
.
decompress
.
unused_data
)
+
8
,
1
)
# Check the CRC and file size, and set the flag so we read
# Check the CRC and file size, and set the flag so we read
# a new member on the next call
# a new member on the next call
self
.
_read_eof
()
self
.
_read_eof
()
self
.
_new_member
=
True
self
.
_new_member
=
True
return
True
def
_add_read_data
(
self
,
data
):
def
_add_read_data
(
self
,
data
):
self
.
crc
=
zlib
.
crc32
(
data
,
self
.
crc
)
&
0xffffffff
L
self
.
crc
=
zlib
.
crc32
(
data
,
self
.
crc
)
&
0xffffffff
L
...
@@ -334,11 +334,14 @@ class GzipFile(io.BufferedIOBase):
...
@@ -334,11 +334,14 @@ class GzipFile(io.BufferedIOBase):
self
.
size
=
self
.
size
+
len
(
data
)
self
.
size
=
self
.
size
+
len
(
data
)
def
_read_eof
(
self
):
def
_read_eof
(
self
):
# We've read to the end of the file.
# We've read to the end of the file, so we have to rewind in order
# to reread the 8 bytes containing the CRC and the file size.
# We check the that the computed CRC and size of the
# We check the that the computed CRC and size of the
# uncompressed data matches the stored values. Note that the size
# uncompressed data matches the stored values. Note that the size
# stored is the true file size mod 2**32.
# stored is the true file size mod 2**32.
crc32
,
isize
=
struct
.
unpack
(
"<II"
,
self
.
_read_exact
(
8
))
self
.
fileobj
.
seek
(
-
8
,
1
)
crc32
=
read32
(
self
.
fileobj
)
isize
=
read32
(
self
.
fileobj
)
# may exceed 2GB
if
crc32
!=
self
.
crc
:
if
crc32
!=
self
.
crc
:
raise
IOError
(
"CRC check failed %s != %s"
%
(
hex
(
crc32
),
raise
IOError
(
"CRC check failed %s != %s"
%
(
hex
(
crc32
),
hex
(
self
.
crc
)))
hex
(
self
.
crc
)))
...
...
Lib/test/test_bz2.py
View file @
6e165b40
...
@@ -325,24 +325,6 @@ class BZ2FileTest(BaseTest):
...
@@ -325,24 +325,6 @@ class BZ2FileTest(BaseTest):
self
.
assertRaises
(
ValueError
,
f
.
readline
)
self
.
assertRaises
(
ValueError
,
f
.
readline
)
self
.
assertRaises
(
ValueError
,
f
.
readlines
)
self
.
assertRaises
(
ValueError
,
f
.
readlines
)
def
test_read_truncated
(
self
):
# Drop the eos_magic field (6 bytes) and CRC (4 bytes).
truncated
=
self
.
DATA
[:
-
10
]
with
open
(
self
.
filename
,
'wb'
)
as
f
:
f
.
write
(
truncated
)
with
BZ2File
(
self
.
filename
)
as
f
:
self
.
assertRaises
(
EOFError
,
f
.
read
)
with
BZ2File
(
self
.
filename
)
as
f
:
self
.
assertEqual
(
f
.
read
(
len
(
self
.
TEXT
)),
self
.
TEXT
)
self
.
assertRaises
(
EOFError
,
f
.
read
,
1
)
# Incomplete 4-byte file header, and block header of at least 146 bits.
for
i
in
range
(
22
):
with
open
(
self
.
filename
,
'wb'
)
as
f
:
f
.
write
(
truncated
[:
i
])
with
BZ2File
(
self
.
filename
)
as
f
:
self
.
assertRaises
(
EOFError
,
f
.
read
,
1
)
class
BZ2CompressorTest
(
BaseTest
):
class
BZ2CompressorTest
(
BaseTest
):
def
testCompress
(
self
):
def
testCompress
(
self
):
# "Test BZ2Compressor.compress()/flush()"
# "Test BZ2Compressor.compress()/flush()"
...
...
Lib/test/test_gzip.py
View file @
6e165b40
...
@@ -289,23 +289,6 @@ class TestGzip(unittest.TestCase):
...
@@ -289,23 +289,6 @@ class TestGzip(unittest.TestCase):
with
gzip
.
GzipFile
(
fileobj
=
f
,
mode
=
"w"
)
as
g
:
with
gzip
.
GzipFile
(
fileobj
=
f
,
mode
=
"w"
)
as
g
:
self
.
assertEqual
(
g
.
name
,
""
)
self
.
assertEqual
(
g
.
name
,
""
)
def
test_read_truncated
(
self
):
data
=
data1
*
50
buf
=
io
.
BytesIO
()
with
gzip
.
GzipFile
(
fileobj
=
buf
,
mode
=
"w"
)
as
f
:
f
.
write
(
data
)
# Drop the CRC (4 bytes) and file size (4 bytes).
truncated
=
buf
.
getvalue
()[:
-
8
]
with
gzip
.
GzipFile
(
fileobj
=
io
.
BytesIO
(
truncated
))
as
f
:
self
.
assertRaises
(
EOFError
,
f
.
read
)
with
gzip
.
GzipFile
(
fileobj
=
io
.
BytesIO
(
truncated
))
as
f
:
self
.
assertEqual
(
f
.
read
(
len
(
data
)),
data
)
self
.
assertRaises
(
EOFError
,
f
.
read
,
1
)
# Incomplete 10-byte header.
for
i
in
range
(
2
,
10
):
with
gzip
.
GzipFile
(
fileobj
=
io
.
BytesIO
(
truncated
[:
i
]))
as
f
:
self
.
assertRaises
(
EOFError
,
f
.
read
,
1
)
def
test_read_with_extra
(
self
):
def
test_read_with_extra
(
self
):
# Gzip data with an extra field
# Gzip data with an extra field
gzdata
=
(
b'
\
x1f
\
x8b
\
x08
\
x04
\
xb2
\
x17
cQ
\
x02
\
xff
'
gzdata
=
(
b'
\
x1f
\
x8b
\
x08
\
x04
\
xb2
\
x17
cQ
\
x02
\
xff
'
...
...
Misc/NEWS
View file @
6e165b40
...
@@ -539,9 +539,6 @@ Library
...
@@ -539,9 +539,6 @@ Library
- Issue #13454: Fix a crash when deleting an iterator created by itertools.tee()
- Issue #13454: Fix a crash when deleting an iterator created by itertools.tee()
if all other iterators were very advanced before.
if all other iterators were very advanced before.
- Issue #1159051: GzipFile now raises EOFError when reading a corrupted file
with truncated header or footer.
- Issue #16992: On Windows in signal.set_wakeup_fd, validate the file
- Issue #16992: On Windows in signal.set_wakeup_fd, validate the file
descriptor argument.
descriptor argument.
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment