@@ -31,16 +31,11 @@ class HTMLTokenizer(object):
31
31
Points to HTMLInputStream object.
32
32
"""
33
33
34
- def __init__ (self , stream , encoding = None , useChardet = True ,
35
- lowercaseElementName = True , lowercaseAttrName = True , parser = None ):
34
+ def __init__ (self , stream , encoding = None , useChardet = True , parser = None ):
36
35
37
36
self .stream = HTMLInputStream (stream , encoding , True , useChardet )
38
37
self .parser = parser
39
38
40
- # Perform case conversions?
41
- self .lowercaseElementName = lowercaseElementName
42
- self .lowercaseAttrName = lowercaseAttrName
43
-
44
39
# Setup the initial tokenizer state
45
40
self .escapeFlag = False
46
41
self .lastFourChars = []
@@ -232,8 +227,7 @@ def emitCurrentToken(self):
232
227
token = self .currentToken
233
228
# Add token to the queue to be yielded
234
229
if (token ["type" ] in tagTokenTypes ):
235
- if self .lowercaseElementName :
236
- token ["name" ] = token ["name" ].translate (asciiUpper2Lower )
230
+ token ["name" ] = token ["name" ].translate (asciiUpper2Lower )
237
231
if token ["type" ] == tokenTypes ["EndTag" ]:
238
232
if token ["data" ]:
239
233
self .tokenQueue .append ({"type" : tokenTypes ["ParseError" ],
@@ -918,9 +912,8 @@ def attributeNameState(self):
918
912
# Attributes are not dropped at this stage. That happens when the
919
913
# start tag token is emitted so values can still be safely appended
920
914
# to attributes, but we do want to report the parse error in time.
921
- if self .lowercaseAttrName :
922
- self .currentToken ["data" ][- 1 ][0 ] = (
923
- self .currentToken ["data" ][- 1 ][0 ].translate (asciiUpper2Lower ))
915
+ self .currentToken ["data" ][- 1 ][0 ] = (
916
+ self .currentToken ["data" ][- 1 ][0 ].translate (asciiUpper2Lower ))
924
917
for name , _ in self .currentToken ["data" ][:- 1 ]:
925
918
if self .currentToken ["data" ][- 1 ][0 ] == name :
926
919
self .tokenQueue .append ({"type" : tokenTypes ["ParseError" ], "data" :
0 commit comments