Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cpython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
cpython
Commits
1de19ac7
Commit
1de19ac7
authored
Dec 04, 2013
by
Nadeem Vawda
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
#19839: Fix regression in bz2 module's handling of non-bzip2 data at EOF.
parent
a5cc9d68
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
51 additions
and
11 deletions
+51
-11
Lib/bz2.py
Lib/bz2.py
+19
-10
Lib/test/test_bz2.py
Lib/test/test_bz2.py
+29
-1
Misc/NEWS
Misc/NEWS
+3
-0
No files found.
Lib/bz2.py
View file @
1de19ac7
...
...
@@ -199,8 +199,15 @@ class BZ2File(io.BufferedIOBase):
# Continue to next stream.
if
self
.
_decompressor
.
eof
:
self
.
_decompressor
=
BZ2Decompressor
()
self
.
_buffer
=
self
.
_decompressor
.
decompress
(
rawblock
)
try
:
self
.
_buffer
=
self
.
_decompressor
.
decompress
(
rawblock
)
except
OSError
:
# Trailing data isn't a valid bzip2 stream. We're done here.
self
.
_mode
=
_MODE_READ_EOF
self
.
_size
=
self
.
_pos
return
False
else
:
self
.
_buffer
=
self
.
_decompressor
.
decompress
(
rawblock
)
self
.
_buffer_offset
=
0
return
True
...
...
@@ -488,17 +495,19 @@ def decompress(data):
For incremental decompression, use a BZ2Decompressor object instead.
"""
if
len
(
data
)
==
0
:
return
b""
results
=
[]
while
True
:
while
data
:
decomp
=
BZ2Decompressor
()
results
.
append
(
decomp
.
decompress
(
data
))
try
:
res
=
decomp
.
decompress
(
data
)
except
OSError
:
if
results
:
break
# Leftover data is not a valid bzip2 stream; ignore it.
else
:
raise
# Error on the first iteration; bail out.
results
.
append
(
res
)
if
not
decomp
.
eof
:
raise
ValueError
(
"Compressed data ended before the "
"end-of-stream marker was reached"
)
if
not
decomp
.
unused_data
:
return
b""
.
join
(
results
)
# There is unused data left over. Proceed to next stream.
data
=
decomp
.
unused_data
return
b""
.
join
(
results
)
Lib/test/test_bz2.py
View file @
1de19ac7
...
...
@@ -49,6 +49,7 @@ class BaseTest(unittest.TestCase):
TEXT
=
b''
.
join
(
TEXT_LINES
)
DATA
=
b'BZh91AY&SY.
\
xc8
N
\
x18
\
x00
\
x01
>_
\
x80
\
x00
\
x10
@
\
x02
\
xff
\
xf0
\
x01
\
x07
n
\
x00
?
\
xe7
\
xff
\
xe0
0
\
x01
\
x99
\
xaa
\
x00
\
xc0
\
x03
F
\
x86
\
x8c
#&
\
x83
F
\
x9a
\
x03
\
x06
\
xa6
\
xd0
\
xa6
\
x93
M
\
x0f
Q
\
xa7
\
xa8
\
x06
\
x80
4hh
\
x12
$
\
x11
\
xa4
i4
\
xf1
4S
\
xd2
<Q
\
xb5
\
x0f
H
\
xd3
\
xd4
\
xdd
\
xd5
\
x87
\
xbb
\
xf8
\
x94
\
r
\
x8f
\
xaf
I
\
x12
\
xe1
\
xc9
\
xf8
/E
\
x00
pu
\
x89
\
x12
]
\
xc9
\
xbb
DL
\
n
Q
\
x0e
\
t
1
\
x12
\
xdf
\
xa0
\
xc0
\
x97
\
xac
2O9
\
x89
\
x13
\
x94
\
x0e
\
x1c
7
\
x0e
d
\
x95
I
\
x0c
\
xaa
J
\
xa4
\
x18
L
\
x10
\
x05
#
\
x9c
\
xaf
\
xba
\
xbc
/
\
x97
\
x8a
#C
\
xc8
\
xe1
\
x8c
W
\
xf9
\
xe2
\
xd0
\
xd6
M
\
xa7
\
x8b
Xa<e
\
x84
t
\
xcb
L
\
xb3
\
xa7
\
xd9
\
xcd
\
xd1
\
xcb
\
x84
.
\
xaf
\
xb3
\
xab
\
xab
\
xad
`n}
\
xa0
lh
\
t
E,
\
x8e
Z
\
x15
\
x17
VH>
\
x88
\
xe5
\
xcd
9gd6
\
x0b
\
n
\
xe9
\
x9b
\
xd5
\
x8a
\
x99
\
xf7
\
x08
.K
\
x8e
v
\
xfb
\
xf7
xw
\
xbb
\
xdf
\
xa1
\
x92
\
xf1
\
xdd
|/";
\
xa2
\
xba
\
x9f
\
xd5
\
xb1
#A
\
xb6
\
xf6
\
xb3
o
\
xc9
\
xc5
y
\
\
\
xeb
O
\
xe7
\
x85
\
x9a
\
xbc
\
xb6
f8
\
x95
2
\
xd5
\
xd7
"%
\
x89
>V,
\
xf7
\
xa6
z
\
xe2
\
x9f
\
xa3
\
xdf
\
x11
\
x11
"
\
xd6
E)I
\
xa9
\
x13
^
\
xca
\
xf3
r
\
xd0
\
x03
U
\
x92
2
\
xf2
6
\
xec
\
xb6
\
xed
\
x8b
\
xc3
U
\
x13
\
x9d
\
xc5
\
x17
0
\
xa4
\
xfa
^
\
x92
\
xac
DF
\
x8a
\
x97
\
xd6
\
x19
\
xfe
\
xdd
\
xb8
\
xbd
\
x1a
\
x9a
\
x19
\
xa3
\
x80
ankR
\
x8b
\
xe5
\
xd8
3]
\
xa9
\
xc6
\
x08
\
x82
f
\
xf6
\
xb9
"6l$
\
xb8
j@
\
xc0
\
x8a
\
xb0
l1..
\
xba
k
\
x83
ls
\
x15
\
xbc
\
xf4
\
xc1
\
x13
\
xbe
\
xf8
E
\
xb8
\
x9d
\
r
\
xa8
\
x9d
k
\
x84
\
xd3
n
\
xfa
\
xac
Q
\
x07
\
xb1
%y
\
xaa
v
\
xb4
\
x08
\
xe0
z
\
x1b
\
x16
\
xf5
\
x04
\
xe9
\
xcc
\
xb9
\
x08
z
\
x1e
n7.G
\
xfc
]
\
xc9
\
x14
\
xe1
B@
\
xbb
!8`'
EMPTY_DATA
=
b'BZh9
\
x17
rE8P
\
x90
\
x00
\
x00
\
x00
\
x00
'
BAD_DATA
=
b'this is not a valid bzip2 file'
def
setUp
(
self
):
self
.
filename
=
TESTFN
...
...
@@ -79,9 +80,10 @@ class BaseTest(unittest.TestCase):
class
BZ2FileTest
(
BaseTest
):
"Test BZ2File type miscellaneous methods."
def
createTempFile
(
self
,
streams
=
1
):
def
createTempFile
(
self
,
streams
=
1
,
suffix
=
b""
):
with
open
(
self
.
filename
,
"wb"
)
as
f
:
f
.
write
(
self
.
DATA
*
streams
)
f
.
write
(
suffix
)
def
testBadArgs
(
self
):
with
self
.
assertRaises
(
TypeError
):
...
...
@@ -103,6 +105,11 @@ class BZ2FileTest(BaseTest):
self
.
assertRaises
(
TypeError
,
bz2f
.
read
,
None
)
self
.
assertEqual
(
bz2f
.
read
(),
self
.
TEXT
)
def
testReadBadFile
(
self
):
self
.
createTempFile
(
streams
=
0
,
suffix
=
self
.
BAD_DATA
)
with
BZ2File
(
self
.
filename
)
as
bz2f
:
self
.
assertRaises
(
OSError
,
bz2f
.
read
)
def
testReadMultiStream
(
self
):
self
.
createTempFile
(
streams
=
5
)
with
BZ2File
(
self
.
filename
)
as
bz2f
:
...
...
@@ -122,6 +129,16 @@ class BZ2FileTest(BaseTest):
finally
:
bz2
.
_BUFFER_SIZE
=
buffer_size
def
testReadTrailingJunk
(
self
):
self
.
createTempFile
(
suffix
=
self
.
BAD_DATA
)
with
BZ2File
(
self
.
filename
)
as
bz2f
:
self
.
assertEqual
(
bz2f
.
read
(),
self
.
TEXT
)
def
testReadMultiStreamTrailingJunk
(
self
):
self
.
createTempFile
(
streams
=
5
,
suffix
=
self
.
BAD_DATA
)
with
BZ2File
(
self
.
filename
)
as
bz2f
:
self
.
assertEqual
(
bz2f
.
read
(),
self
.
TEXT
*
5
)
def
testRead0
(
self
):
self
.
createTempFile
()
with
BZ2File
(
self
.
filename
)
as
bz2f
:
...
...
@@ -707,10 +724,21 @@ class CompressDecompressTest(BaseTest):
def
testDecompressIncomplete
(
self
):
self
.
assertRaises
(
ValueError
,
bz2
.
decompress
,
self
.
DATA
[:
-
10
])
def
testDecompressBadData
(
self
):
self
.
assertRaises
(
OSError
,
bz2
.
decompress
,
self
.
BAD_DATA
)
def
testDecompressMultiStream
(
self
):
text
=
bz2
.
decompress
(
self
.
DATA
*
5
)
self
.
assertEqual
(
text
,
self
.
TEXT
*
5
)
def
testDecompressTrailingJunk
(
self
):
text
=
bz2
.
decompress
(
self
.
DATA
+
self
.
BAD_DATA
)
self
.
assertEqual
(
text
,
self
.
TEXT
)
def
testDecompressMultiStreamTrailingJunk
(
self
):
text
=
bz2
.
decompress
(
self
.
DATA
*
5
+
self
.
BAD_DATA
)
self
.
assertEqual
(
text
,
self
.
TEXT
*
5
)
class
OpenTest
(
BaseTest
):
def
test_binary_modes
(
self
):
...
...
Misc/NEWS
View file @
1de19ac7
...
...
@@ -18,6 +18,9 @@ Core and Builtins
Library
-------
- Issue #19839: Fix regression in bz2 module'
s
handling
of
non
-
bzip2
data
at
EOF
.
-
Issue
#
19138
:
doctest
's IGNORE_EXCEPTION_DETAIL now allows a match when
no exception detail exists (no colon following the exception'
s
name
,
or
a
colon
does
follow
but
no
text
follows
the
colon
).
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment