Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cpython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Kirill Smelkov
cpython
Commits
efdad60c
Commit
efdad60c
authored
Mar 19, 2004
by
Hye-Shik Chang
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
Add a new unicode codec: ptcp154 (Kazakh)
parent
a3d1c2e8
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
172 additions
and
0 deletions
+172
-0
Doc/lib/libcodecs.tex
Doc/lib/libcodecs.tex
+4
-0
Lib/encodings/aliases.py
Lib/encodings/aliases.py
+6
-0
Lib/encodings/ptcp154.py
Lib/encodings/ptcp154.py
+162
-0
No files found.
Doc/lib/libcodecs.tex
View file @
efdad60c
...
...
@@ -829,6 +829,10 @@ exist:
{
macturkish
}
{
Turkish
}
\lineiii
{
ptcp154
}
{
csptcp154, pt154, cp154, cyrillic-asian
}
{
Kazakh
}
\lineiii
{
shift
_
jis
}
{
csshiftjis, shiftjis, sjis, s
_
jis
}
{
Japanese
}
...
...
Lib/encodings/aliases.py
View file @
efdad60c
...
...
@@ -396,6 +396,12 @@ aliases = {
# mbcs codec
'dbcs'
:
'mbcs'
,
# ptcp154 codec
'csptcp154'
:
'ptcp154'
,
'pt154'
:
'ptcp154'
,
'cp154'
:
'ptcp154'
,
'cyrillic-asian'
:
'ptcp154'
,
# quopri_codec codec
'quopri'
:
'quopri_codec'
,
'quoted_printable'
:
'quopri_codec'
,
...
...
Lib/encodings/ptcp154.py
0 → 100644
View file @
efdad60c
""" Python Character Mapping Codec generated from 'PTCP154.txt' with gencodec.py.
Written by Marc-Andre Lemburg (mal@lemburg.com).
(c) Copyright CNRI, All Rights Reserved. NO WARRANTY.
(c) Copyright 2000 Guido van Rossum.
"""
#"
import
codecs
### Codec APIs
class Codec(codecs.Codec):
    """Stateless PTCP154 codec built on the generic charmap helpers.

    Both directions look up the module-level ``encoding_map`` and
    ``decoding_map`` tables at call time; those tables are defined further
    down in this module.
    """

    def encode(self, input, errors='strict'):
        """Encode *input* through ``encoding_map``.

        *errors* is handed unchanged to ``codecs.charmap_encode``, whose
        result is returned as is.
        """
        encoded = codecs.charmap_encode(input, errors, encoding_map)
        return encoded

    def decode(self, input, errors='strict'):
        """Decode *input* through ``decoding_map``.

        *errors* is handed unchanged to ``codecs.charmap_decode``, whose
        result is returned as is.
        """
        decoded = codecs.charmap_decode(input, errors, decoding_map)
        return decoded
class StreamWriter(Codec, codecs.StreamWriter):
    """Stream writer combining ``Codec`` with ``codecs.StreamWriter``.

    Adds nothing of its own; everything comes from the two base classes.
    """
class StreamReader(Codec, codecs.StreamReader):
    """Stream reader combining ``Codec`` with ``codecs.StreamReader``.

    Adds nothing of its own; everything comes from the two base classes.
    """
### encodings module API
def getregentry():
    """Return the registry entry for this encoding.

    The entry is the 4-tuple ``(encoder, decoder, StreamReader,
    StreamWriter)``.  The encoder and decoder are bound methods taken from
    two separate, freshly created ``Codec`` instances.
    """
    encoder = Codec().encode
    decoder = Codec().decode
    return (encoder, decoder, StreamReader, StreamWriter)
### Decoding Map
# Start from the identity mapping for all 256 byte values; the update below
# overrides only the bytes that differ from it.  Bytes absent from the
# override table (0x00-0x7F, 0xA0, 0xA7, 0xA9, 0xAB, 0xAC, 0xAE, 0xB0, 0xB6,
# 0xB7, 0xBB) therefore keep mapping to the code point of the same number.
decoding_map = codecs.make_identity_dict(range(256))
decoding_map.update({
    # 0x80-0x9F: extended Cyrillic letters and typographic punctuation
    0x80: 0x0496,  # CYRILLIC CAPITAL LETTER ZHE WITH DESCENDER
    0x81: 0x0492,  # CYRILLIC CAPITAL LETTER GHE WITH STROKE
    0x82: 0x04ee,  # CYRILLIC CAPITAL LETTER U WITH MACRON
    0x83: 0x0493,  # CYRILLIC SMALL LETTER GHE WITH STROKE
    0x84: 0x201e,  # DOUBLE LOW-9 QUOTATION MARK
    0x85: 0x2026,  # HORIZONTAL ELLIPSIS
    0x86: 0x04b6,  # CYRILLIC CAPITAL LETTER CHE WITH DESCENDER
    0x87: 0x04ae,  # CYRILLIC CAPITAL LETTER STRAIGHT U
    0x88: 0x04b2,  # CYRILLIC CAPITAL LETTER HA WITH DESCENDER
    0x89: 0x04af,  # CYRILLIC SMALL LETTER STRAIGHT U
    0x8a: 0x04a0,  # CYRILLIC CAPITAL LETTER BASHKIR KA
    0x8b: 0x04e2,  # CYRILLIC CAPITAL LETTER I WITH MACRON
    0x8c: 0x04a2,  # CYRILLIC CAPITAL LETTER EN WITH DESCENDER
    0x8d: 0x049a,  # CYRILLIC CAPITAL LETTER KA WITH DESCENDER
    0x8e: 0x04ba,  # CYRILLIC CAPITAL LETTER SHHA
    0x8f: 0x04b8,  # CYRILLIC CAPITAL LETTER CHE WITH VERTICAL STROKE
    0x90: 0x0497,  # CYRILLIC SMALL LETTER ZHE WITH DESCENDER
    0x91: 0x2018,  # LEFT SINGLE QUOTATION MARK
    0x92: 0x2019,  # RIGHT SINGLE QUOTATION MARK
    0x93: 0x201c,  # LEFT DOUBLE QUOTATION MARK
    0x94: 0x201d,  # RIGHT DOUBLE QUOTATION MARK
    0x95: 0x2022,  # BULLET
    0x96: 0x2013,  # EN DASH
    0x97: 0x2014,  # EM DASH
    0x98: 0x04b3,  # CYRILLIC SMALL LETTER HA WITH DESCENDER
    0x99: 0x04b7,  # CYRILLIC SMALL LETTER CHE WITH DESCENDER
    0x9a: 0x04a1,  # CYRILLIC SMALL LETTER BASHKIR KA
    0x9b: 0x04e3,  # CYRILLIC SMALL LETTER I WITH MACRON
    0x9c: 0x04a3,  # CYRILLIC SMALL LETTER EN WITH DESCENDER
    0x9d: 0x049b,  # CYRILLIC SMALL LETTER KA WITH DESCENDER
    0x9e: 0x04bb,  # CYRILLIC SMALL LETTER SHHA
    0x9f: 0x04b9,  # CYRILLIC SMALL LETTER CHE WITH VERTICAL STROKE

    # 0xA1-0xBF: further Cyrillic letters and the numero sign
    0xa1: 0x040e,  # CYRILLIC CAPITAL LETTER SHORT U (Byelorussian)
    0xa2: 0x045e,  # CYRILLIC SMALL LETTER SHORT U (Byelorussian)
    0xa3: 0x0408,  # CYRILLIC CAPITAL LETTER JE
    0xa4: 0x04e8,  # CYRILLIC CAPITAL LETTER BARRED O
    0xa5: 0x0498,  # CYRILLIC CAPITAL LETTER ZE WITH DESCENDER
    0xa6: 0x04b0,  # CYRILLIC CAPITAL LETTER STRAIGHT U WITH STROKE
    0xa8: 0x0401,  # CYRILLIC CAPITAL LETTER IO
    0xaa: 0x04d8,  # CYRILLIC CAPITAL LETTER SCHWA
    0xad: 0x04ef,  # CYRILLIC SMALL LETTER U WITH MACRON
    0xaf: 0x049c,  # CYRILLIC CAPITAL LETTER KA WITH VERTICAL STROKE
    0xb1: 0x04b1,  # CYRILLIC SMALL LETTER STRAIGHT U WITH STROKE
    0xb2: 0x0406,  # CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
    0xb3: 0x0456,  # CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
    0xb4: 0x0499,  # CYRILLIC SMALL LETTER ZE WITH DESCENDER
    0xb5: 0x04e9,  # CYRILLIC SMALL LETTER BARRED O
    0xb8: 0x0451,  # CYRILLIC SMALL LETTER IO
    0xb9: 0x2116,  # NUMERO SIGN
    0xba: 0x04d9,  # CYRILLIC SMALL LETTER SCHWA
    0xbc: 0x0458,  # CYRILLIC SMALL LETTER JE
    0xbd: 0x04aa,  # CYRILLIC CAPITAL LETTER ES WITH DESCENDER
    0xbe: 0x04ab,  # CYRILLIC SMALL LETTER ES WITH DESCENDER
    0xbf: 0x049d,  # CYRILLIC SMALL LETTER KA WITH VERTICAL STROKE

    # 0xC0-0xDF: capital letters U+0410..U+042F
    0xc0: 0x0410,  # CYRILLIC CAPITAL LETTER A
    0xc1: 0x0411,  # CYRILLIC CAPITAL LETTER BE
    0xc2: 0x0412,  # CYRILLIC CAPITAL LETTER VE
    0xc3: 0x0413,  # CYRILLIC CAPITAL LETTER GHE
    0xc4: 0x0414,  # CYRILLIC CAPITAL LETTER DE
    0xc5: 0x0415,  # CYRILLIC CAPITAL LETTER IE
    0xc6: 0x0416,  # CYRILLIC CAPITAL LETTER ZHE
    0xc7: 0x0417,  # CYRILLIC CAPITAL LETTER ZE
    0xc8: 0x0418,  # CYRILLIC CAPITAL LETTER I
    0xc9: 0x0419,  # CYRILLIC CAPITAL LETTER SHORT I
    0xca: 0x041a,  # CYRILLIC CAPITAL LETTER KA
    0xcb: 0x041b,  # CYRILLIC CAPITAL LETTER EL
    0xcc: 0x041c,  # CYRILLIC CAPITAL LETTER EM
    0xcd: 0x041d,  # CYRILLIC CAPITAL LETTER EN
    0xce: 0x041e,  # CYRILLIC CAPITAL LETTER O
    0xcf: 0x041f,  # CYRILLIC CAPITAL LETTER PE
    0xd0: 0x0420,  # CYRILLIC CAPITAL LETTER ER
    0xd1: 0x0421,  # CYRILLIC CAPITAL LETTER ES
    0xd2: 0x0422,  # CYRILLIC CAPITAL LETTER TE
    0xd3: 0x0423,  # CYRILLIC CAPITAL LETTER U
    0xd4: 0x0424,  # CYRILLIC CAPITAL LETTER EF
    0xd5: 0x0425,  # CYRILLIC CAPITAL LETTER HA
    0xd6: 0x0426,  # CYRILLIC CAPITAL LETTER TSE
    0xd7: 0x0427,  # CYRILLIC CAPITAL LETTER CHE
    0xd8: 0x0428,  # CYRILLIC CAPITAL LETTER SHA
    0xd9: 0x0429,  # CYRILLIC CAPITAL LETTER SHCHA
    0xda: 0x042a,  # CYRILLIC CAPITAL LETTER HARD SIGN
    0xdb: 0x042b,  # CYRILLIC CAPITAL LETTER YERU
    0xdc: 0x042c,  # CYRILLIC CAPITAL LETTER SOFT SIGN
    0xdd: 0x042d,  # CYRILLIC CAPITAL LETTER E
    0xde: 0x042e,  # CYRILLIC CAPITAL LETTER YU
    0xdf: 0x042f,  # CYRILLIC CAPITAL LETTER YA

    # 0xE0-0xFF: small letters U+0430..U+044F
    0xe0: 0x0430,  # CYRILLIC SMALL LETTER A
    0xe1: 0x0431,  # CYRILLIC SMALL LETTER BE
    0xe2: 0x0432,  # CYRILLIC SMALL LETTER VE
    0xe3: 0x0433,  # CYRILLIC SMALL LETTER GHE
    0xe4: 0x0434,  # CYRILLIC SMALL LETTER DE
    0xe5: 0x0435,  # CYRILLIC SMALL LETTER IE
    0xe6: 0x0436,  # CYRILLIC SMALL LETTER ZHE
    0xe7: 0x0437,  # CYRILLIC SMALL LETTER ZE
    0xe8: 0x0438,  # CYRILLIC SMALL LETTER I
    0xe9: 0x0439,  # CYRILLIC SMALL LETTER SHORT I
    0xea: 0x043a,  # CYRILLIC SMALL LETTER KA
    0xeb: 0x043b,  # CYRILLIC SMALL LETTER EL
    0xec: 0x043c,  # CYRILLIC SMALL LETTER EM
    0xed: 0x043d,  # CYRILLIC SMALL LETTER EN
    0xee: 0x043e,  # CYRILLIC SMALL LETTER O
    0xef: 0x043f,  # CYRILLIC SMALL LETTER PE
    0xf0: 0x0440,  # CYRILLIC SMALL LETTER ER
    0xf1: 0x0441,  # CYRILLIC SMALL LETTER ES
    0xf2: 0x0442,  # CYRILLIC SMALL LETTER TE
    0xf3: 0x0443,  # CYRILLIC SMALL LETTER U
    0xf4: 0x0444,  # CYRILLIC SMALL LETTER EF
    0xf5: 0x0445,  # CYRILLIC SMALL LETTER HA
    0xf6: 0x0446,  # CYRILLIC SMALL LETTER TSE
    0xf7: 0x0447,  # CYRILLIC SMALL LETTER CHE
    0xf8: 0x0448,  # CYRILLIC SMALL LETTER SHA
    0xf9: 0x0449,  # CYRILLIC SMALL LETTER SHCHA
    0xfa: 0x044a,  # CYRILLIC SMALL LETTER HARD SIGN
    0xfb: 0x044b,  # CYRILLIC SMALL LETTER YERU
    0xfc: 0x044c,  # CYRILLIC SMALL LETTER SOFT SIGN
    0xfd: 0x044d,  # CYRILLIC SMALL LETTER E
    0xfe: 0x044e,  # CYRILLIC SMALL LETTER YU
    0xff: 0x044f,  # CYRILLIC SMALL LETTER YA
})

### Encoding Map

# The encoding table is derived from the finished decoding table, so it must
# be built only after every override above has been applied.
encoding_map = codecs.make_encoding_map(decoding_map)
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment