Commit f0eeedf0 authored by Serhiy Storchaka

Issue #22681: Added support for the koi8_t encoding.

parent ad8a1c3f
...@@ -1160,6 +1160,10 @@ particular, the following variants typically exist: ...@@ -1160,6 +1160,10 @@ particular, the following variants typically exist:
+-----------------+--------------------------------+--------------------------------+ +-----------------+--------------------------------+--------------------------------+
| koi8_r | | Russian | | koi8_r | | Russian |
+-----------------+--------------------------------+--------------------------------+ +-----------------+--------------------------------+--------------------------------+
| koi8_t | | Tajik |
| | | |
| | | .. versionadded:: 3.5 |
+-----------------+--------------------------------+--------------------------------+
| koi8_u | | Ukrainian | | koi8_u | | Ukrainian |
+-----------------+--------------------------------+--------------------------------+ +-----------------+--------------------------------+--------------------------------+
| kz1048 | kz_1048, strk1048_2002, rk1048 | Kazakh | | kz1048 | kz_1048, strk1048_2002, rk1048 | Kazakh |
......
...@@ -234,6 +234,9 @@ Some smaller changes made to the core Python language are: ...@@ -234,6 +234,9 @@ Some smaller changes made to the core Python language are:
* New Kazakh :ref:`codec <standard-encodings>` ``kz1048``. (Contributed by * New Kazakh :ref:`codec <standard-encodings>` ``kz1048``. (Contributed by
Serhiy Storchaka in :issue:`22682`.) Serhiy Storchaka in :issue:`22682`.)
* New Tajik :ref:`codec <standard-encodings>` ``koi8_t``. (Contributed by
Serhiy Storchaka in :issue:`22681`.)
New Modules New Modules
=========== ===========
......
...@@ -699,6 +699,7 @@ locale_encoding_alias = { ...@@ -699,6 +699,7 @@ locale_encoding_alias = {
'euc_kr': 'eucKR', 'euc_kr': 'eucKR',
'utf_8': 'UTF-8', 'utf_8': 'UTF-8',
'koi8_r': 'KOI8-R', 'koi8_r': 'KOI8-R',
'koi8_t': 'KOI8-T',
'koi8_u': 'KOI8-U', 'koi8_u': 'KOI8-U',
'kz1048': 'RK1048', 'kz1048': 'RK1048',
'cp1251': 'CP1251', 'cp1251': 'CP1251',
......
...@@ -1822,6 +1822,7 @@ all_unicode_encodings = [ ...@@ -1822,6 +1822,7 @@ all_unicode_encodings = [
"iso8859_9", "iso8859_9",
"johab", "johab",
"koi8_r", "koi8_r",
"koi8_t",
"koi8_u", "koi8_u",
"kz1048", "kz1048",
"latin_1", "latin_1",
......
...@@ -2081,7 +2081,8 @@ class UnicodeTest(string_tests.CommonTest, ...@@ -2081,7 +2081,8 @@ class UnicodeTest(string_tests.CommonTest,
'cp863', 'cp865', 'cp866', 'cp1125', 'cp863', 'cp865', 'cp866', 'cp1125',
'iso8859_10', 'iso8859_13', 'iso8859_14', 'iso8859_15', 'iso8859_10', 'iso8859_13', 'iso8859_14', 'iso8859_15',
'iso8859_2', 'iso8859_3', 'iso8859_4', 'iso8859_5', 'iso8859_6', 'iso8859_2', 'iso8859_3', 'iso8859_4', 'iso8859_5', 'iso8859_6',
'iso8859_7', 'iso8859_9', 'koi8_r', 'kz1048', 'latin_1', 'iso8859_7', 'iso8859_9',
'koi8_r', 'koi8_t', 'koi8_u', 'kz1048', 'latin_1',
'mac_cyrillic', 'mac_latin2', 'mac_cyrillic', 'mac_latin2',
'cp1250', 'cp1251', 'cp1252', 'cp1253', 'cp1254', 'cp1255', 'cp1250', 'cp1251', 'cp1252', 'cp1253', 'cp1254', 'cp1255',
...@@ -2109,14 +2110,14 @@ class UnicodeTest(string_tests.CommonTest, ...@@ -2109,14 +2110,14 @@ class UnicodeTest(string_tests.CommonTest,
'cp863', 'cp865', 'cp866', 'cp1125', 'cp863', 'cp865', 'cp866', 'cp1125',
'iso8859_10', 'iso8859_13', 'iso8859_14', 'iso8859_15', 'iso8859_10', 'iso8859_13', 'iso8859_14', 'iso8859_15',
'iso8859_2', 'iso8859_4', 'iso8859_5', 'iso8859_2', 'iso8859_4', 'iso8859_5',
'iso8859_9', 'koi8_r', 'latin_1', 'iso8859_9', 'koi8_r', 'koi8_u', 'latin_1',
'mac_cyrillic', 'mac_latin2', 'mac_cyrillic', 'mac_latin2',
### These have undefined mappings: ### These have undefined mappings:
#'cp1250', 'cp1251', 'cp1252', 'cp1253', 'cp1254', 'cp1255', #'cp1250', 'cp1251', 'cp1252', 'cp1253', 'cp1254', 'cp1255',
#'cp1256', 'cp1257', 'cp1258', #'cp1256', 'cp1257', 'cp1258',
#'cp424', 'cp856', 'cp857', 'cp864', 'cp869', 'cp874', #'cp424', 'cp856', 'cp857', 'cp864', 'cp869', 'cp874',
#'iso8859_3', 'iso8859_6', 'iso8859_7', 'kz1048', #'iso8859_3', 'iso8859_6', 'iso8859_7', 'koi8_t', 'kz1048',
#'mac_greek', 'mac_iceland','mac_roman', 'mac_turkish', #'mac_greek', 'mac_iceland','mac_roman', 'mac_turkish',
### These fail the round-trip: ### These fail the round-trip:
......
...@@ -704,7 +704,7 @@ class ElementTreeTest(unittest.TestCase): ...@@ -704,7 +704,7 @@ class ElementTreeTest(unittest.TestCase):
'mac-roman', 'mac-turkish', 'mac-roman', 'mac-turkish',
'iso2022-jp', 'iso2022-jp-1', 'iso2022-jp-2', 'iso2022-jp-2004', 'iso2022-jp', 'iso2022-jp-1', 'iso2022-jp-2', 'iso2022-jp-2004',
'iso2022-jp-3', 'iso2022-jp-ext', 'iso2022-jp-3', 'iso2022-jp-ext',
'koi8-r', 'koi8-u', 'kz1048', 'koi8-r', 'koi8-t', 'koi8-u', 'kz1048',
'hz', 'ptcp154', 'hz', 'ptcp154',
] ]
for encoding in supported_encodings: for encoding in supported_encodings:
......
...@@ -42,6 +42,8 @@ Core and Builtins ...@@ -42,6 +42,8 @@ Core and Builtins
Library Library
------- -------
- Issue #22681: Added support for the koi8_t encoding.
- Issue #22682: Added support for the kz1048 encoding. - Issue #22682: Added support for the kz1048 encoding.
- Issue #23796: peek and read1 methods of BufferedReader now raise ValueError - Issue #23796: peek and read1 methods of BufferedReader now raise ValueError
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment