Skip to content
Projects
Groups
Snippets
Help
Loading...
Help
Support
Keyboard shortcuts
?
Submit feedback
Contribute to GitLab
Sign in / Register
Toggle navigation
C
cython
Project overview
Project overview
Details
Activity
Releases
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Issues
0
Issues
0
List
Boards
Labels
Milestones
Merge Requests
0
Merge Requests
0
Analytics
Analytics
Repository
Value Stream
Wiki
Wiki
Snippets
Snippets
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Create a new issue
Commits
Issue Boards
Open sidebar
Gwenaël Samain
cython
Commits
0f9a60d9
Commit
0f9a60d9
authored
Apr 24, 2015
by
Stefan Behnel
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
intern identifier names in parser to save memory
make sure all identifiers are EncodedString objects
parent
cf9fc1a9
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
with
52 additions
and
36 deletions
+52
-36
Cython/Compiler/Main.py
Cython/Compiler/Main.py
+24
-1
Cython/Compiler/Parsing.py
Cython/Compiler/Parsing.py
+27
-31
Cython/Compiler/Scanning.py
Cython/Compiler/Scanning.py
+1
-4
No files found.
Cython/Compiler/Main.py
View file @
0f9a60d9
...
...
@@ -19,6 +19,7 @@ from . import Errors
# conditional metaclass. These options are processed by CmdLine called from
# main() in this file.
# import Parsing
from
.StringEncoding
import
EncodedString
from
.Scanning
import
PyrexScanner
,
FileSourceDescriptor
from
.Errors
import
PyrexError
,
CompileError
,
error
,
warning
from
.Symtab
import
ModuleScope
...
...
@@ -76,7 +77,8 @@ class Context(object):
self
.
cpp
=
cpp
self
.
options
=
options
self
.
pxds
=
{}
# full name -> node tree
self
.
pxds
=
{}
# full name -> node tree
self
.
_interned
=
{}
# (type(value), value, *key_args) -> interned_value
standard_include_path
=
os
.
path
.
abspath
(
os
.
path
.
normpath
(
os
.
path
.
join
(
os
.
path
.
dirname
(
__file__
),
os
.
path
.
pardir
,
'Includes'
)))
...
...
@@ -93,6 +95,27 @@ class Context(object):
self
.
future_directives
.
update
([
print_function
,
unicode_literals
,
absolute_import
,
division
])
self
.
modules
[
'builtins'
]
=
self
.
modules
[
'__builtin__'
]
def
intern_ustring
(
self
,
value
,
encoding
=
None
):
key
=
(
EncodedString
,
value
,
encoding
)
try
:
return
self
.
_interned
[
key
]
except
KeyError
:
pass
value
=
EncodedString
(
value
)
if
encoding
:
value
.
encoding
=
encoding
self
.
_interned
[
key
]
=
value
return
value
def
intern_value
(
self
,
value
,
*
key
):
key
=
(
type
(
value
),
value
)
+
key
try
:
return
self
.
_interned
[
key
]
except
KeyError
:
pass
self
.
_interned
[
key
]
=
value
return
value
# pipeline creation functions can now be found in Pipeline.py
def
process_pxd
(
self
,
source_desc
,
scope
,
module_name
):
...
...
Cython/Compiler/Parsing.py
View file @
0f9a60d9
...
...
@@ -53,7 +53,7 @@ class Ctx(object):
d
.
update
(
kwds
)
return
ctx
def
p_ident
(
s
,
message
=
"Expected an identifier"
):
def
p_ident
(
s
,
message
=
"Expected an identifier"
):
if
s
.
sy
==
'IDENT'
:
name
=
s
.
systring
s
.
next
()
...
...
@@ -405,9 +405,9 @@ def p_trailer(s, node1):
return
p_index
(
s
,
node1
)
else
:
# s.sy == '.'
s
.
next
()
name
=
EncodedString
(
p_ident
(
s
)
)
name
=
p_ident
(
s
)
return
ExprNodes
.
AttributeNode
(
pos
,
obj
=
node1
,
attribute
=
name
)
obj
=
node1
,
attribute
=
name
)
# arglist: argument (',' argument)* [',']
# argument: [test '='] test # Really [keyword '='] test
...
...
@@ -434,7 +434,7 @@ def p_call_parse_args(s, allow_genexp = True):
if
not
arg
.
is_name
:
s
.
error
(
"Expected an identifier before '='"
,
pos
=
arg
.
pos
)
encoded_name
=
EncodedS
tring
(
arg
.
name
)
encoded_name
=
s
.
context
.
intern_us
tring
(
arg
.
name
)
keyword
=
ExprNodes
.
IdentifierStringNode
(
arg
.
pos
,
value
=
encoded_name
)
arg
=
p_test
(
s
)
...
...
@@ -643,7 +643,7 @@ def p_atom(s):
else
:
return
ExprNodes
.
StringNode
(
pos
,
value
=
bytes_value
,
unicode_value
=
unicode_value
)
elif
sy
==
'IDENT'
:
name
=
EncodedString
(
s
.
systring
)
name
=
s
.
systring
s
.
next
()
if
name
==
"None"
:
return
ExprNodes
.
NoneNode
(
pos
)
...
...
@@ -1295,7 +1295,6 @@ def p_import_statement(s):
stats
=
[]
is_absolute
=
Future
.
absolute_import
in
s
.
context
.
future_directives
for
pos
,
target_name
,
dotted_name
,
as_name
in
items
:
dotted_name
=
EncodedString
(
dotted_name
)
if
kind
==
'cimport'
:
stat
=
Nodes
.
CImportStatNode
(
pos
,
...
...
@@ -1305,7 +1304,7 @@ def p_import_statement(s):
else
:
if
as_name
and
"."
in
dotted_name
:
name_list
=
ExprNodes
.
ListNode
(
pos
,
args
=
[
ExprNodes
.
IdentifierStringNode
(
pos
,
value
=
EncodedS
tring
(
"*"
))])
ExprNodes
.
IdentifierStringNode
(
pos
,
value
=
s
.
context
.
intern_us
tring
(
"*"
))])
else
:
name_list
=
None
stat
=
Nodes
.
SingleAssignmentNode
(
...
...
@@ -1347,7 +1346,7 @@ def p_from_import_statement(s, first_statement = 0):
is_cimport
=
kind
==
'cimport'
is_parenthesized
=
False
if
s
.
sy
==
'*'
:
imported_names
=
[(
s
.
position
(),
"*"
,
None
,
None
)]
imported_names
=
[(
s
.
position
(),
s
.
context
.
intern_ustring
(
"*"
)
,
None
,
None
)]
s
.
next
()
else
:
if
s
.
sy
==
'('
:
...
...
@@ -1361,7 +1360,6 @@ def p_from_import_statement(s, first_statement = 0):
imported_names
.
append
(
p_imported_name
(
s
,
is_cimport
))
if
is_parenthesized
:
s
.
expect
(
')'
)
dotted_name
=
EncodedString
(
dotted_name
)
if
dotted_name
==
'__future__'
:
if
not
first_statement
:
s
.
error
(
"from __future__ imports must occur at the beginning of the file"
)
...
...
@@ -1388,16 +1386,12 @@ def p_from_import_statement(s, first_statement = 0):
imported_name_strings
=
[]
items
=
[]
for
(
name_pos
,
name
,
as_name
,
kind
)
in
imported_names
:
encoded_name
=
EncodedString
(
name
)
imported_name_strings
.
append
(
ExprNodes
.
IdentifierStringNode
(
name_pos
,
value
=
encoded_
name
))
ExprNodes
.
IdentifierStringNode
(
name_pos
,
value
=
name
))
items
.
append
(
(
name
,
ExprNodes
.
NameNode
(
name_pos
,
name
=
as_name
or
name
)))
(
name
,
ExprNodes
.
NameNode
(
name_pos
,
name
=
as_name
or
name
)))
import_list
=
ExprNodes
.
ListNode
(
imported_names
[
0
][
0
],
args
=
imported_name_strings
)
dotted_name
=
EncodedString
(
dotted_name
)
imported_names
[
0
][
0
],
args
=
imported_name_strings
)
return
Nodes
.
FromImportStatNode
(
pos
,
module
=
ExprNodes
.
ImportNode
(
dotted_name_pos
,
module_name
=
ExprNodes
.
IdentifierStringNode
(
pos
,
value
=
dotted_name
),
...
...
@@ -1405,8 +1399,8 @@ def p_from_import_statement(s, first_statement = 0):
name_list
=
import_list
),
items
=
items
)
imported_name_kinds
=
cython
.
declare
(
set
,
set
([
'class'
,
'struct'
,
'union'
]))
imported_name_kinds
=
cython
.
declare
(
set
,
set
([
'class'
,
'struct'
,
'union'
]))
def
p_imported_name
(
s
,
is_cimport
):
pos
=
s
.
position
()
...
...
@@ -1418,6 +1412,7 @@ def p_imported_name(s, is_cimport):
as_name
=
p_as_name
(
s
)
return
(
pos
,
name
,
as_name
,
kind
)
def
p_dotted_name
(
s
,
as_allowed
):
pos
=
s
.
position
()
target_name
=
p_ident
(
s
)
...
...
@@ -1428,7 +1423,8 @@ def p_dotted_name(s, as_allowed):
names
.
append
(
p_ident
(
s
))
if
as_allowed
:
as_name
=
p_as_name
(
s
)
return
(
pos
,
target_name
,
u'.'
.
join
(
names
),
as_name
)
return
(
pos
,
target_name
,
s
.
context
.
intern_ustring
(
u'.'
.
join
(
names
)),
as_name
)
def
p_as_name
(
s
):
if
s
.
sy
==
'IDENT'
and
s
.
systring
==
'as'
:
...
...
@@ -1437,6 +1433,7 @@ def p_as_name(s):
else
:
return
None
def
p_assert_statement
(
s
):
# s.sy == 'assert'
pos
=
s
.
position
()
...
...
@@ -1449,6 +1446,7 @@ def p_assert_statement(s):
value
=
None
return
Nodes
.
AssertStatNode
(
pos
,
cond
=
cond
,
value
=
value
)
statement_terminators
=
cython
.
declare
(
set
,
set
([
';'
,
'NEWLINE'
,
'EOF'
]))
def
p_if_statement
(
s
):
...
...
@@ -1993,8 +1991,7 @@ def p_positional_and_keyword_args(s, end_sy_set, templates = None):
arg
=
Nodes
.
CComplexBaseTypeNode
(
base_type
.
pos
,
base_type
=
base_type
,
declarator
=
declarator
)
parsed_type
=
True
keyword_node
=
ExprNodes
.
IdentifierStringNode
(
arg
.
pos
,
value
=
EncodedString
(
ident
))
keyword_node
=
ExprNodes
.
IdentifierStringNode
(
arg
.
pos
,
value
=
ident
)
keyword_args
.
append
((
keyword_node
,
arg
))
was_keyword
=
True
...
...
@@ -2105,7 +2102,7 @@ def p_c_simple_base_type(s, self_flag, nonempty, templates = None):
s
.
next
()
elif
looking_at_dotted_name
(
s
):
#print "p_c_simple_base_type: looking_at_type_name at", s.position()
name
=
s
.
systring
name
=
s
.
context
.
intern_ustring
(
s
.
systring
)
s
.
next
()
while
s
.
sy
==
'.'
:
module_path
.
append
(
name
)
...
...
@@ -2361,7 +2358,7 @@ def p_c_declarator(s, ctx = Ctx(), empty = 0, is_type = 0, cmethod_flag = 0,
if
s
.
sy
==
'('
:
s
.
next
()
if
s
.
sy
==
')'
or
looking_at_name
(
s
):
base
=
Nodes
.
CNameDeclaratorNode
(
pos
,
name
=
EncodedString
(
u""
),
cname
=
None
)
base
=
Nodes
.
CNameDeclaratorNode
(
pos
,
name
=
s
.
context
.
intern_ustring
(
u""
),
cname
=
None
)
result
=
p_c_func_declarator
(
s
,
pos
,
ctx
,
base
,
cmethod_flag
)
else
:
result
=
p_c_declarator
(
s
,
ctx
,
empty
=
empty
,
is_type
=
is_type
,
...
...
@@ -2454,7 +2451,7 @@ def p_c_simple_declarator(s, ctx, empty, is_type, cmethod_flag,
else
:
rhs
=
None
if
s
.
sy
==
'IDENT'
:
name
=
EncodedString
(
s
.
systring
)
name
=
s
.
systring
if
empty
:
error
(
s
.
position
(),
"Declarator should be empty"
)
s
.
next
()
...
...
@@ -2913,11 +2910,10 @@ def p_decorators(s):
s
.
next
()
decstring
=
p_dotted_name
(
s
,
as_allowed
=
0
)[
2
]
names
=
decstring
.
split
(
'.'
)
decorator
=
ExprNodes
.
NameNode
(
pos
,
name
=
EncodedS
tring
(
names
[
0
]))
decorator
=
ExprNodes
.
NameNode
(
pos
,
name
=
s
.
context
.
intern_us
tring
(
names
[
0
]))
for
name
in
names
[
1
:]:
decorator
=
ExprNodes
.
AttributeNode
(
pos
,
attribute
=
EncodedString
(
name
),
obj
=
decorator
)
decorator
=
ExprNodes
.
AttributeNode
(
pos
,
attribute
=
s
.
context
.
intern_ustring
(
name
),
obj
=
decorator
)
if
s
.
sy
==
'('
:
decorator
=
p_call
(
s
,
decorator
)
decorators
.
append
(
Nodes
.
DecoratorNode
(
pos
,
decorator
=
decorator
))
...
...
@@ -2928,7 +2924,7 @@ def p_def_statement(s, decorators=None):
# s.sy == 'def'
pos
=
s
.
position
()
s
.
next
()
name
=
EncodedString
(
p_ident
(
s
)
)
name
=
p_ident
(
s
)
s
.
expect
(
'('
)
args
,
star_arg
,
starstar_arg
=
p_varargslist
(
s
,
terminator
=
')'
)
s
.
expect
(
')'
)
...
...
@@ -2977,8 +2973,8 @@ def p_class_statement(s, decorators):
# s.sy == 'class'
pos
=
s
.
position
()
s
.
next
()
class_name
=
EncodedString
(
p_ident
(
s
)
)
class_name
.
encoding
=
s
.
source_encoding
class_name
=
EncodedString
(
p_ident
(
s
)
)
class_name
.
encoding
=
s
.
source_encoding
# FIXME: why is this needed?
arg_tuple
=
None
keyword_dict
=
None
starstar_arg
=
None
...
...
Cython/Compiler/Scanning.py
View file @
0f9a60d9
...
...
@@ -421,14 +421,11 @@ class PyrexScanner(Scanner):
if
systring
in
self
.
keywords
:
if
systring
==
u'print'
and
print_function
in
self
.
context
.
future_directives
:
self
.
keywords
.
discard
(
'print'
)
systring
=
EncodedString
(
systring
)
elif
systring
==
u'exec'
and
self
.
context
.
language_level
>=
3
:
self
.
keywords
.
discard
(
'exec'
)
systring
=
EncodedString
(
systring
)
else
:
sy
=
systring
else
:
systring
=
EncodedString
(
systring
)
systring
=
self
.
context
.
intern_ustring
(
systring
)
self
.
sy
=
sy
self
.
systring
=
systring
if
False
:
# debug_scanner:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment