Skip to content

Commit 10f027f

Browse files
tushargr authored and bmcutler committed
fix python_tokenizer tok_name error (#9)
* fix python_tokenizer tok_name error
* remove import which is not required in python_tokenizer.py
* remove empty value tokens
1 parent 5dbf127 commit 10f027f

File tree

1 file changed

+8
-9
lines changed

1 file changed

+8
-9
lines changed

tokenizer/python/python_tokenizer.py

+8-9
Original file line number | Diff line number | Diff line change
@@ -1,21 +1,20 @@
11
import parso
22
from parso.python.tokenize import tokenize
3-
from parso.python.token import tok_name
43
import json
5-
import sys
4+
import sys
65

76
file = open(sys.argv[1],'r')
87
file_content = file.read()
98

109
tokens = []
1110

1211
for token in tokenize(file_content, version_info=(3,6)):
13-
tmp = dict()
14-
tmp["line"]=(token.start_pos)[0];
15-
tmp["char"]=((token.start_pos)[1])+1;
16-
tmp["type"]=str(tok_name[token.type])
17-
tmp["value"]=str(token.string)
18-
tokens.append(tmp)
12+
if (str(token.string) != ""):
13+
tmp = dict()
14+
tmp["line"]=(token.start_pos)[0];
15+
tmp["char"]=((token.start_pos)[1])+1;
16+
tmp["type"]=((str(token.type))[10:]).strip(")")
17+
tmp["value"]=str(token.string)
18+
tokens.append(tmp)
1919

2020
print ( json.dumps(tokens, indent=4, sort_keys=True) )
21-

0 commit comments

Comments
 (0)