DataViews/CodeMetrics.py

changeset 12:1d8dd9706f46
parent 0:de9c2efb9d02
child 13:1af94a91f439
comparison: 11:b0996e4a289e vs 12:1d8dd9706f46
--- a/DataViews/CodeMetrics.py
+++ b/DataViews/CodeMetrics.py
@@ -13,16 +13,14 @@
 
 @exception ValueError the tokenize module is too old
 """
 
 import os
-import cStringIO
+import io
 import keyword
 import token
 import tokenize
-if not hasattr(tokenize, 'NL'):
-    raise ValueError("tokenize.NL doesn't exist -- tokenize module too old")
 
 import Utilities
 
 KEYWORD = token.NT_OFFSET + 1
 COMMENT = tokenize.COMMENT
@@ -61,15 +59,27 @@
         if not text.endswith(os.linesep):
             text = "%s%s" % (text, os.linesep)
 
         self.lines = text.count(os.linesep)
 
-        source = cStringIO.StringIO(text)
+        source = io.BytesIO(text.encode("utf-8"))
         try:
-            tokenize.tokenize(source.readline, self.__tokeneater)
-        except tokenize.TokenError, msg:
-            print "Token Error: %s" % str(msg)
+            gen = tokenize.tokenize(source.readline)
+            for toktype, toktext, start, end, line in gen:
+                (srow, scol) = start
+                (erow, ecol) = end
+                if toktype in [token.NEWLINE, tokenize.NL]:
+                    self.__addToken(toktype, os.linesep, srow, scol, line)
+                elif toktype in [token.INDENT, token.DEDENT]:
+                    self.__addToken(toktype, '', srow, scol, line)
+                elif toktype == token.NAME and keyword.iskeyword(toktext):
+                    toktype = KEYWORD
+                    self.__addToken(toktype, toktext, srow, scol, line)
+                else:
+                    self.__addToken(toktype, toktext, srow, scol, line)
+        except tokenize.TokenError as msg:
+            print("Token Error: %s" % str(msg))
             return
 
         return
 
     def __addToken(self, toktype, toktext, srow, scol, line):
@@ -82,35 +92,10 @@
         @param scol starting column of the token (int)
         @param line logical line the token was found (string)
         """
         self.tokenlist.append(Token(type=toktype, text=toktext, row=srow,
                                     col=scol, line=line))
-
-    def __tokeneater(self, toktype, toktext, (srow, scol), (erow, ecol), line):
-        """
-        Private method called by tokenize.tokenize.
-
-        @param toktype the type of the token (int)
-        @param toktext the text of the token (string)
-        @param srow starting row of the token (int)
-        @param scol starting column of the token (int)
-        @param erow ending row of the token (int)
-        @param ecol ending column of the token (int)
-        @param line logical line the token was found (string)
-        """
-        if toktype in [token.NEWLINE, tokenize.NL]:
-            self.__addToken(toktype, os.linesep, srow, scol, line)
-            return
-
-        if toktype in [token.INDENT, token.DEDENT]:
-            self.__addToken(toktype, '', srow, scol, line)
-            return
-
-        if toktype == token.NAME and keyword.iskeyword(toktext):
-            toktype = KEYWORD
-
-        self.__addToken(toktype, toktext, srow, scol, line)
 
 spacer = ' '
 
 class SourceStat(object):
     """
@@ -179,12 +164,12 @@
     def dump(self):
         """
         Public method used to format and print the collected statistics.
         """
         label_len = 79 - len(spacer) - 6 * 6
-        print spacer + "FUNCTION / CLASS".ljust(label_len) + \
-            " START   END LINES  NLOC  COMM EMPTY"
+        print(spacer + "FUNCTION / CLASS".ljust(label_len) + \
+            " START   END LINES  NLOC  COMM EMPTY")
         for id in self.identifiers + ['TOTAL ']:
             label = id
             counters = self.counters.get(id, {})
             msg = spacer + label.ljust(label_len)
 
@@ -192,11 +177,11 @@
                 if counters.get(key, 0):
                     msg += " %5d" % (counters[key],)
                 else:
                     msg += " " * 6
 
-            print msg
+            print(msg)
 
     def getCounter(self, id, key):
         """
         Public method used to get a specific counter value.
 
@@ -224,13 +209,13 @@
 
     @param filename name of the Python file to be analyzed (string)
    @param total dictionary receiving the overall code statistics
     @return a statistics object with the collected code statistics (SourceStat)
     """
-    file = open(filename, 'rb')
+    file = open(filename, 'r')
     try:
-        text = Utilities.decode(file.read())[0].encode('utf-8')
+        text = file.read()
     finally:
         file.close()
 
     parser = Parser()
     parser.parse(text)
@@ -243,22 +228,22 @@
         tok = parser.tokenlist[idx]
 
         # counting
         if tok.type == NEWLINE:
             stats.inc('nloc')
-        if tok.type == COMMENT:
+        elif tok.type == COMMENT:
             stats.inc('comments')
-        if tok.type == EMPTY:
+        elif tok.type == EMPTY:
             if parser.tokenlist[idx-1].type == token.OP:
                 stats.inc('nloc')
             else:
                 stats.inc('empty')
-
-        if tok.type == INDENT: stats.indent(tok)
-        if tok.type == DEDENT: stats.dedent(tok)
-
-        if tok.type == KEYWORD:
+        elif tok.type == INDENT:
+            stats.indent(tok)
+        elif tok.type == DEDENT:
+            stats.dedent(tok)
+        elif tok.type == KEYWORD:
             if tok.text in ("class", "def"):
                 stats.push(parser.tokenlist[idx+1].text, tok.row)
 
     # collect overall statistics
     summarize(total, 'lines', parser.lines)
@@ -285,18 +270,18 @@
 
     total = {}
 
     summarize(total, 'files', len(files))
     for file in files:
-        print file
+        print(file)
         stats = analyze(file, total)
         stats.dump()
 
-    print "\nSummary"
+    print("\nSummary")
     for key in ['files', 'lines', 'bytes', 'comments',
                 'empty lines', 'non-commentary lines']:
-        print key.ljust(20) + "%6d" % total[key]
+        print(key.ljust(20) + "%6d" % total[key])
 
     sys.exit(0)
 
 if __name__ == "__main__":
     main()
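Note on the main change: this changeset replaces Python 2's callback-based tokenizer interface (tokenize.tokenize(readline, tokeneater), which drove the removed __tokeneater() method) with Python 3's generator interface, whose 5-tuples parse() now unpacks inline. Below is a minimal, self-contained sketch of the new pattern; the sample source string and the keyword counting are illustrative only, not part of the changeset:

    import io
    import keyword
    import token
    import tokenize

    SOURCE = "def answer():\n    return 42\n"

    # Python 3's tokenize.tokenize() wants a readline callable that
    # yields bytes, hence the encode() -- the same reason the changeset
    # uses io.BytesIO(text.encode("utf-8")).
    readline = io.BytesIO(SOURCE.encode("utf-8")).readline

    keywords = 0
    for toktype, toktext, start, end, line in tokenize.tokenize(readline):
        if toktype == token.NAME and keyword.iskeyword(toktext):
            keywords += 1  # counts 'def' and 'return' here
        print(tokenize.tok_name[toktype], repr(toktext), start)

    print("keywords:", keywords)  # -> keywords: 2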

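A related subtlety behind the open(filename, 'r') and io.BytesIO(text.encode("utf-8")) changes: in Python 3, tokenize.tokenize() does its own encoding detection on the byte stream (PEP 263 coding cookie or BOM) and yields an ENCODING token first, while tokenize.generate_tokens() is the counterpart for already-decoded str input. A small sketch contrasting the two entry points (the sample text is illustrative):

    import io
    import tokenize

    text = "# -*- coding: utf-8 -*-\nname = 'métrique'\n"

    # Bytes path: tokenize() reads the coding cookie itself and emits
    # an ENCODING token before anything else.
    btoks = list(tokenize.tokenize(io.BytesIO(text.encode("utf-8")).readline))
    print(btoks[0].type == tokenize.ENCODING, btoks[0].string)  # True utf-8

    # Str path: generate_tokens() assumes the caller has decoded already,
    # so no ENCODING token is produced.
    stoks = list(tokenize.generate_tokens(io.StringIO(text).readline))
    print(stoks[0].type == tokenize.ENCODING)  # False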