Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cpython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
cpython
Commits
85e3ee74
Commit
85e3ee74
authored
Apr 13, 2015
by
Antoine Pitrou
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Issue #22982: Improve BOM handling when seeking to multiple positions of a writable text file.
parent
20d31b51
Changes
4
Show whitespace changes
Inline
Side-by-side
Showing
4 changed files
with
52 additions
and
15 deletions
+52
-15
Lib/_pyio.py
Lib/_pyio.py
+15
-11
Lib/test/test_io.py
Lib/test/test_io.py
+13
-0
Misc/NEWS
Misc/NEWS
+3
-0
Modules/_io/textio.c
Modules/_io/textio.c
+21
-4
No files found.
Lib/_pyio.py
View file @
85e3ee74
...
...
@@ -1865,6 +1865,19 @@ class TextIOWrapper(TextIOBase):
return
buffer
def
seek
(
self
,
cookie
,
whence
=
0
):
def
_reset_encoder
(
position
):
"""Reset the encoder (merely useful for proper BOM handling)"""
try
:
encoder
=
self
.
_encoder
or
self
.
_get_encoder
()
except
LookupError
:
# Sometimes the encoder doesn't exist
pass
else
:
if
position
!=
0
:
encoder
.
setstate
(
0
)
else
:
encoder
.
reset
()
if
self
.
closed
:
raise
ValueError
(
"tell on closed file"
)
if
not
self
.
_seekable
:
...
...
@@ -1885,6 +1898,7 @@ class TextIOWrapper(TextIOBase):
self
.
_snapshot
=
None
if
self
.
_decoder
:
self
.
_decoder
.
reset
()
_reset_encoder
(
position
)
return
position
if
whence
!=
0
:
raise
ValueError
(
"unsupported whence (%r)"
%
(
whence
,))
...
...
@@ -1922,17 +1936,7 @@ class TextIOWrapper(TextIOBase):
raise
OSError
(
"can't restore logical file position"
)
self
.
_decoded_chars_used
=
chars_to_skip
# Finally, reset the encoder (merely useful for proper BOM handling)
try
:
encoder
=
self
.
_encoder
or
self
.
_get_encoder
()
except
LookupError
:
# Sometimes the encoder doesn't exist
pass
else
:
if
cookie
!=
0
:
encoder
.
setstate
(
0
)
else
:
encoder
.
reset
()
_reset_encoder
(
cookie
)
return
cookie
def
read
(
self
,
size
=
None
):
...
...
Lib/test/test_io.py
View file @
85e3ee74
...
...
@@ -2669,6 +2669,19 @@ class TextIOWrapperTest(unittest.TestCase):
with
self
.
open
(
filename
,
'rb'
)
as
f
:
self
.
assertEqual
(
f
.
read
(),
'bbbzzz'
.
encode
(
charset
))
def
test_seek_append_bom
(
self
):
# Same test, but first seek to the start and then to the end
filename
=
support
.
TESTFN
for
charset
in
(
'utf-8-sig'
,
'utf-16'
,
'utf-32'
):
with
self
.
open
(
filename
,
'w'
,
encoding
=
charset
)
as
f
:
f
.
write
(
'aaa'
)
with
self
.
open
(
filename
,
'a'
,
encoding
=
charset
)
as
f
:
f
.
seek
(
0
)
f
.
seek
(
0
,
self
.
SEEK_END
)
f
.
write
(
'xxx'
)
with
self
.
open
(
filename
,
'rb'
)
as
f
:
self
.
assertEqual
(
f
.
read
(),
'aaaxxx'
.
encode
(
charset
))
def
test_errors_property
(
self
):
with
self
.
open
(
support
.
TESTFN
,
"w"
)
as
f
:
self
.
assertEqual
(
f
.
errors
,
"strict"
)
...
...
Misc/NEWS
View file @
85e3ee74
...
...
@@ -29,6 +29,9 @@ Core and Builtins
Library
-------
- Issue #22982: Improve BOM handling when seeking to multiple positions of
a writable text file.
- Issue #23865: close() methods in multiple modules now are idempotent and more
robust at shutdown. If a close() method needs to release multiple resources,
they are all released even if errors occur.
...
...
Modules/_io/textio.c
View file @
85e3ee74
...
...
@@ -2042,11 +2042,10 @@ _textiowrapper_decoder_setstate(textio *self, cookie_type *cookie)
}
static
int
_textiowrapper_encoder_
setstate
(
textio
*
self
,
cookie_type
*
cookie
)
_textiowrapper_encoder_
reset
(
textio
*
self
,
int
start_of_stream
)
{
PyObject
*
res
;
/* Same as _textiowrapper_decoder_setstate() above. */
if
(
cookie
->
start_pos
==
0
&&
cookie
->
dec_flags
==
0
)
{
if
(
start_of_stream
)
{
res
=
PyObject_CallMethodObjArgs
(
self
->
encoder
,
_PyIO_str_reset
,
NULL
);
self
->
encoding_start_of_stream
=
1
;
}
...
...
@@ -2061,6 +2060,14 @@ _textiowrapper_encoder_setstate(textio *self, cookie_type *cookie)
return
0
;
}
static
int
_textiowrapper_encoder_setstate
(
textio
*
self
,
cookie_type
*
cookie
)
{
/* Same as _textiowrapper_decoder_setstate() above. */
return
_textiowrapper_encoder_reset
(
self
,
cookie
->
start_pos
==
0
&&
cookie
->
dec_flags
==
0
);
}
static
PyObject
*
textiowrapper_seek
(
textio
*
self
,
PyObject
*
args
)
{
...
...
@@ -2128,7 +2135,17 @@ textiowrapper_seek(textio *self, PyObject *args)
}
res
=
_PyObject_CallMethodId
(
self
->
buffer
,
&
PyId_seek
,
"ii"
,
0
,
2
);
Py_XDECREF
(
cookieObj
);
Py_CLEAR
(
cookieObj
);
if
(
res
==
NULL
)
goto
fail
;
if
(
self
->
encoder
)
{
/* If seek() == 0, we are at the start of stream, otherwise not */
cmp
=
PyObject_RichCompareBool
(
res
,
_PyIO_zero
,
Py_EQ
);
if
(
cmp
<
0
||
_textiowrapper_encoder_reset
(
self
,
cmp
))
{
Py_DECREF
(
res
);
goto
fail
;
}
}
return
res
;
}
else
if
(
whence
!=
0
)
{
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment