From 3747b009bf2ffc33910667e3c1d6dd36810ca24d Mon Sep 17 00:00:00 2001 From: farhad Date: Sun, 14 Sep 2014 11:34:27 +0400 Subject: [PATCH] fix tokenization of code containing unicode strings --- jedi/parser/tokenize.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/jedi/parser/tokenize.py b/jedi/parser/tokenize.py index d988135c..08099e79 100644 --- a/jedi/parser/tokenize.py +++ b/jedi/parser/tokenize.py @@ -137,7 +137,7 @@ double = r'[^"\\]*(?:\\.[^"\\]*)*"' single3 = r"[^'\\]*(?:(?:\\.|'(?!''))[^'\\]*)*'''" # Tail end of """ string. double3 = r'[^"\\]*(?:(?:\\.|"(?!""))[^"\\]*)*"""' -triple = group("[bB]?[rR]?'''", '[bB]?[rR]?"""') +triple = group("[uUbB]?[rR]?'''", '[uUbB]?[rR]?"""') # Single-line ' or " string. # Because of leftmost-then-longest match semantics, be sure to put the @@ -193,7 +193,7 @@ single_quoted = {} for t in ("'", '"', "r'", 'r"', "R'", 'R"', "b'", 'b"', "B'", 'B"', - "u'", 'u""', "U'", 'U"', + "u'", 'u"', "U'", 'U"', "br'", 'br"', "Br'", 'Br"', "bR'", 'bR"', "BR'", 'BR"'): single_quoted[t] = t