Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(37)

Side by Side Diff: tools/lexer_generator/regex_parser.py

Issue 157813004: Experimental parser: store literals as ints (Closed) Base URL: https://v8.googlecode.com/svn/branches/experimental/parser
Patch Set: Created 6 years, 10 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch | Annotate | Revision Log
« no previous file with comments | « tools/lexer_generator/nfa_builder.py ('k') | tools/lexer_generator/transition_key_test.py » ('j') | no next file with comments »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 # Copyright 2013 the V8 project authors. All rights reserved. 1 # Copyright 2013 the V8 project authors. All rights reserved.
2 # Redistribution and use in source and binary forms, with or without 2 # Redistribution and use in source and binary forms, with or without
3 # modification, are permitted provided that the following conditions are 3 # modification, are permitted provided that the following conditions are
4 # met: 4 # met:
5 # 5 #
6 # * Redistributions of source code must retain the above copyright 6 # * Redistributions of source code must retain the above copyright
7 # notice, this list of conditions and the following disclaimer. 7 # notice, this list of conditions and the following disclaimer.
8 # * Redistributions in binary form must reproduce the above 8 # * Redistributions in binary form must reproduce the above
9 # copyright notice, this list of conditions and the following 9 # copyright notice, this list of conditions and the following
10 # disclaimer in the documentation and/or other materials provided 10 # disclaimer in the documentation and/or other materials provided
(...skipping 220 matching lines...) Expand 10 before | Expand all | Expand 10 after
231 p[0] = ("REPEAT", p[2], p[2]) 231 p[0] = ("REPEAT", p[2], p[2])
232 elif len(p) == 6: 232 elif len(p) == 6:
233 p[0] = ("REPEAT", p[2], p[4]) 233 p[0] = ("REPEAT", p[2], p[4])
234 elif p[1]: 234 elif p[1]:
235 p[0] = (self.token_map[p[1]],) 235 p[0] = (self.token_map[p[1]],)
236 else: 236 else:
237 p[0] = None 237 p[0] = None
238 238
239 def p_literal(self, p): 239 def p_literal(self, p):
240 '''literal : LITERAL''' 240 '''literal : LITERAL'''
241 p[0] = Term('LITERAL', p[1]) 241 p[0] = Term('LITERAL', ord(p[1]))
242 242
243 def p_any(self, p): 243 def p_any(self, p):
244 '''any : ANY''' 244 '''any : ANY'''
245 p[0] = Term(self.token_map[p[1]]) 245 p[0] = Term(self.token_map[p[1]])
246 246
247 def p_class(self, p): 247 def p_class(self, p):
248 '''class : CLASS_BEGIN class_content CLASS_END 248 '''class : CLASS_BEGIN class_content CLASS_END
249 | CLASS_BEGIN NOT class_content CLASS_END''' 249 | CLASS_BEGIN NOT class_content CLASS_END'''
250 if len(p) == 4: 250 if len(p) == 4:
251 p[0] = Term("CLASS", p[2]) 251 p[0] = Term("CLASS", p[2])
252 else: 252 else:
253 p[0] = Term("NOT_CLASS", p[3]) 253 p[0] = Term("NOT_CLASS", p[3])
254 254
255 def p_group(self, p): 255 def p_group(self, p):
256 '''group : GROUP_BEGIN start GROUP_END''' 256 '''group : GROUP_BEGIN start GROUP_END'''
257 p[0] = p[2] 257 p[0] = p[2]
258 258
259 def p_class_content(self, p): 259 def p_class_content(self, p):
260 '''class_content : CLASS_LITERAL RANGE CLASS_LITERAL maybe_class_content 260 '''class_content : CLASS_LITERAL RANGE CLASS_LITERAL maybe_class_content
261 | CLASS_LITERAL maybe_class_content 261 | CLASS_LITERAL maybe_class_content
262 | CHARACTER_CLASS maybe_class_content 262 | CHARACTER_CLASS maybe_class_content
263 ''' 263 '''
264 if len(p) == 5: 264 if len(p) == 5:
265 left = Term("RANGE", p[1], p[3]) 265 left = Term("RANGE", ord(p[1]), ord(p[3]))
266 else: 266 else:
267 if len(p[1]) == 1: 267 if len(p[1]) == 1:
268 left = Term('LITERAL', p[1]) 268 left = Term('LITERAL', ord(p[1]))
269 else: 269 else:
270 left = Term('CHARACTER_CLASS', p[1][1:-1]) 270 left = Term('CHARACTER_CLASS', p[1][1:-1])
271 p[0] = self.__cat(left, p[len(p)-1]) 271 p[0] = self.__cat(left, p[len(p)-1])
272 272
273 def p_maybe_class_content(self, p): 273 def p_maybe_class_content(self, p):
274 '''maybe_class_content : class_content 274 '''maybe_class_content : class_content
275 | empty''' 275 | empty'''
276 p[0] = p[1] 276 p[0] = p[1]
277 277
278 def p_empty(self, p): 278 def p_empty(self, p):
279 'empty :' 279 'empty :'
280 280
281 def p_error(self, p): 281 def p_error(self, p):
282 raise Exception("Syntax error in input '%s'" % str(p)) 282 raise Exception("Syntax error in input '%s'" % str(p))
283 283
284 @staticmethod 284 @staticmethod
285 def __cat(left, right): 285 def __cat(left, right):
286 assert left 286 assert left
287 return NfaBuilder.cat_terms([left] if not right else [left, right]) 287 return NfaBuilder.cat_terms([left] if not right else [left, right])
288 288
289 @staticmethod 289 @staticmethod
290 def parse(string): 290 def parse(string):
291 new_lexer = lambda: RegexLexer() 291 new_lexer = lambda: RegexLexer()
292 new_parser = lambda: RegexParser() 292 new_parser = lambda: RegexParser()
293 return ParserBuilder.parse(string, "RegexParser", new_lexer, new_parser) 293 return ParserBuilder.parse(string, "RegexParser", new_lexer, new_parser)
OLDNEW
« no previous file with comments | « tools/lexer_generator/nfa_builder.py ('k') | tools/lexer_generator/transition_key_test.py » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698