string="D",
start=(1, 0),
end=(1, 1),
- line="D A C A E\n",
+ line="D A C A E",
),
TokenInfo(
type=NAME,
string="A",
start=(1, 2),
end=(1, 3),
- line="D A C A E\n",
+ line="D A C A E",
),
],
TokenInfo(
string="C",
start=(1, 4),
end=(1, 5),
- line="D A C A E\n",
+ line="D A C A E",
),
],
TokenInfo(
string="A",
start=(1, 6),
end=(1, 7),
- line="D A C A E\n",
+ line="D A C A E",
),
],
TokenInfo(
- type=NAME, string="E", start=(1, 8), end=(1, 9), line="D A C A E\n"
+ type=NAME, string="E", start=(1, 8), end=(1, 9), line="D A C A E"
),
],
)
string="B",
start=(1, 0),
end=(1, 1),
- line="B C A E\n",
+ line="B C A E",
),
TokenInfo(
type=NAME,
string="C",
start=(1, 2),
end=(1, 3),
- line="B C A E\n",
+ line="B C A E",
),
],
TokenInfo(
- type=NAME, string="A", start=(1, 4), end=(1, 5), line="B C A E\n"
+ type=NAME, string="A", start=(1, 4), end=(1, 5), line="B C A E"
),
],
TokenInfo(
- type=NAME, string="E", start=(1, 6), end=(1, 7), line="B C A E\n"
+ type=NAME, string="E", start=(1, 6), end=(1, 7), line="B C A E"
),
],
)
node,
[
TokenInfo(
- NAME, string="foo", start=(1, 0), end=(1, 3), line="foo = 12 + 12 .\n"
+ NAME, string="foo", start=(1, 0), end=(1, 3), line="foo = 12 + 12 ."
),
TokenInfo(
- OP, string="=", start=(1, 4), end=(1, 5), line="foo = 12 + 12 .\n"
+ OP, string="=", start=(1, 4), end=(1, 5), line="foo = 12 + 12 ."
),
[
TokenInfo(
string="12",
start=(1, 6),
end=(1, 8),
- line="foo = 12 + 12 .\n",
+ line="foo = 12 + 12 .",
),
[
[
string="+",
start=(1, 9),
end=(1, 10),
- line="foo = 12 + 12 .\n",
+ line="foo = 12 + 12 .",
),
TokenInfo(
NUMBER,
string="12",
start=(1, 11),
end=(1, 13),
- line="foo = 12 + 12 .\n",
+ line="foo = 12 + 12 .",
),
]
],
self.assertEqual(
node,
[
- TokenInfo(OP, string="(", start=(1, 0), end=(1, 1), line="(1)\n"),
- TokenInfo(NUMBER, string="1", start=(1, 1), end=(1, 2), line="(1)\n"),
- TokenInfo(OP, string=")", start=(1, 2), end=(1, 3), line="(1)\n"),
+ TokenInfo(OP, string="(", start=(1, 0), end=(1, 1), line="(1)"),
+ TokenInfo(NUMBER, string="1", start=(1, 1), end=(1, 2), line="(1)"),
+ TokenInfo(OP, string=")", start=(1, 2), end=(1, 3), line="(1)"),
],
)
# skip the initial encoding token and the end tokens
tokens = list(_generate_tokens_from_c_tokenizer(readline().__next__, encoding='utf-8',
extra_tokens=True))[:-2]
- expected_tokens = [TokenInfo(3, '"ЉЊЈЁЂ"', (1, 0), (1, 7), '"ЉЊЈЁЂ"\n')]
+ expected_tokens = [TokenInfo(3, '"ЉЊЈЁЂ"', (1, 0), (1, 7), '"ЉЊЈЁЂ"')]
self.assertEqual(tokens, expected_tokens,
"bytes not decoded with encoding")
TokenInfo(type=token.NUMBER, string='1', start=(1, 4), end=(1, 5), line='b = 1\n'),
TokenInfo(type=token.NEWLINE, string='\n', start=(1, 5), end=(1, 6), line='b = 1\n'),
TokenInfo(type=token.NL, string='\n', start=(2, 0), end=(2, 1), line='\n'),
- TokenInfo(type=token.COMMENT, string='#test', start=(3, 0), end=(3, 5), line='#test\n'),
- TokenInfo(type=token.NL, string='', start=(3, 5), end=(3, 6), line='#test\n'),
+ TokenInfo(type=token.COMMENT, string='#test', start=(3, 0), end=(3, 5), line='#test'),
+ TokenInfo(type=token.NL, string='', start=(3, 5), end=(3, 6), line='#test'),
TokenInfo(type=token.ENDMARKER, string='', start=(4, 0), end=(4, 0), line='')
]
TokenInfo(token.ENCODING, string='utf-8', start=(0, 0), end=(0, 0), line=''),
TokenInfo(token.NAME, string='a', start=(1, 0), end=(1, 1), line='a\n'),
TokenInfo(token.NEWLINE, string='\n', start=(1, 1), end=(1, 2), line='a\n'),
- TokenInfo(token.NL, string='', start=(2, 1), end=(2, 2), line=' \n'),
+ TokenInfo(token.NL, string='', start=(2, 1), end=(2, 2), line=' '),
TokenInfo(token.ENDMARKER, string='', start=(3, 0), end=(3, 0), line='')
]
yield "1+1".encode(encoding)
expected = [
- TokenInfo(type=NUMBER, string='1', start=(1, 0), end=(1, 1), line='1+1\n'),
- TokenInfo(type=OP, string='+', start=(1, 1), end=(1, 2), line='1+1\n'),
- TokenInfo(type=NUMBER, string='1', start=(1, 2), end=(1, 3), line='1+1\n'),
- TokenInfo(type=NEWLINE, string='', start=(1, 3), end=(1, 4), line='1+1\n'),
+ TokenInfo(type=NUMBER, string='1', start=(1, 0), end=(1, 1), line='1+1'),
+ TokenInfo(type=OP, string='+', start=(1, 1), end=(1, 2), line='1+1'),
+ TokenInfo(type=NUMBER, string='1', start=(1, 2), end=(1, 3), line='1+1'),
+ TokenInfo(type=NEWLINE, string='', start=(1, 3), end=(1, 4), line='1+1'),
TokenInfo(type=ENDMARKER, string='', start=(2, 0), end=(2, 0), line='')
]
for encoding in ["utf-8", "latin-1", "utf-16"]:
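(Aside, not part of the diff.) Taken together, the updated expectations encode a single behavioural change: tokens on the last line of a source that lacks a terminating newline now report that line verbatim instead of appending an implicit "\n". A minimal sketch with the string-based API, assuming a Python build that includes this change:

import io
import tokenize

src = "1+1"  # no trailing newline, like the inputs in the tests above
for tok in tokenize.generate_tokens(io.StringIO(src).readline):
    # After this change: line == '1+1' for the NUMBER, OP and NEWLINE tokens.
    # Before it: line == '1+1\n', with the newline supplied by the tokenizer.
    print(tokenize.tok_name[tok.type], repr(tok.string), repr(tok.line))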