sublime-wakatime/packages/wakatime/stats.py

106 lines
2.6 KiB
Python
Raw Normal View History

2013-09-23 00:51:23 +04:00
# -*- coding: utf-8 -*-
"""
wakatime.stats
~~~~~~~~~~~~~~
Stats about files
:copyright: (c) 2013 Alan Hamlett.
:license: BSD, see LICENSE for more details.
"""
import logging
import os
import sys
2014-09-30 20:27:35 +04:00
from .compat import u, open
2014-12-23 14:39:07 +03:00
from .languages import DependencyParser
2014-09-30 20:27:35 +04:00
2013-09-23 02:24:50 +04:00
# Prepend the Pygments directory under ``packages/`` that matches the running
# major Python version, so it takes priority on the import path.
sys.path.insert(
    0,
    os.path.join(
        os.path.dirname(os.path.abspath(__file__)),
        'packages',
        'pygments_py2' if sys.version_info[0] == 2 else 'pygments_py3',
    ),
)
2013-09-23 03:31:12 +04:00
from pygments.lexers import guess_lexer_for_filename
2013-09-23 00:51:23 +04:00
# Module-level logger; it uses the fixed 'WakaTime' logger name rather than
# this module's ``__name__``.
log = logging.getLogger('WakaTime')
2013-09-23 00:51:23 +04:00
2013-10-26 08:33:31 +04:00
# File name extensions (lowercase, without the leading dot) that are always
# reported as a fixed language.
EXTENSIONS = dict(
    j2='HTML',
    markdown='Markdown',
    md='Markdown',
    mdown='Markdown',
    twig='Twig',
)
2013-10-27 04:59:41 +04:00
# Language names that are reported under a simpler name instead, grouped here
# by the name they are translated to.
TRANSLATIONS = {
    variant: base
    for base, variants in (
        ('CSS', ('CSS+Genshi Text', 'CSS+Lasso')),
        ('HTML', ('HTML+Django/Jinja', 'HTML+Lasso', 'RHTML')),
        ('JavaScript', ('JavaScript+Genshi Text', 'JavaScript+Lasso')),
        ('Perl', ('Perl6',)),
    )
    for variant in variants
}
2013-10-26 08:33:31 +04:00
2013-09-23 00:51:23 +04:00
def guess_language(file_name):
    """Guess the language of a file from its extension and its contents.

    A bounded prefix of the file (``read(512000)``) is handed to Pygments'
    ``guess_lexer_for_filename``. A language forced by the file extension
    takes precedence; otherwise the translated lexer name is used.

    :param file_name: path of the file to inspect; may be empty or None.
    :returns: a ``(language, lexer)`` tuple. Either element is None when it
        could not be determined.
    """
    language, lexer = None, None
    try:
        with open(file_name, 'r', encoding='utf-8') as fh:
            lexer = guess_lexer_for_filename(file_name, fh.read(512000))
    except Exception:
        # Best effort: a file that cannot be opened, decoded or matched to a
        # lexer simply has no lexer. KeyboardInterrupt and SystemExit are
        # deliberately not caught here.
        pass
    if file_name:
        # Only the final path component can carry an extension, and a name
        # without a dot has none (a file called "md" is not Markdown).
        base_name = os.path.basename(file_name)
        if '.' in base_name:
            language = guess_language_from_extension(base_name.rsplit('.', 1)[-1])
    if lexer and language is None:
        language = translate_language(u(lexer.name))
    return language, lexer
2013-09-23 00:51:23 +04:00
2013-10-26 08:33:31 +04:00
def guess_language_from_extension(extension):
    """Return the language forced for ``extension``, or None.

    The extension is looked up in ``EXTENSIONS`` exactly as given first and
    then lowercased. An empty or None extension yields None.
    """
    if not extension:
        return None
    try:
        return EXTENSIONS[extension]
    except KeyError:
        pass
    # Fall back to a case-insensitive match, e.g. "MD" -> "md".
    return EXTENSIONS.get(extension.lower())
2013-10-27 04:59:41 +04:00
def translate_language(language):
    """Return the name ``language`` is translated to in ``TRANSLATIONS``.

    Names without an entry are returned unchanged.
    """
    return TRANSLATIONS.get(language, language)
2013-09-23 00:51:23 +04:00
def number_lines_in_file(file_name):
    """Count the lines in a UTF-8 text file.

    :param file_name: path of the file to read.
    :returns: the number of lines, or None when the file cannot be opened,
        read or decoded as UTF-8.
    """
    try:
        with open(file_name, 'r', encoding='utf-8') as fh:
            return sum(1 for _ in fh)
    except Exception:
        # Best effort: any ordinary failure means "unknown". KeyboardInterrupt
        # and SystemExit are deliberately allowed to propagate.
        return None
2015-03-10 01:23:29 +03:00
def get_file_stats(file_name, notfile=False):
    """Collect language, dependency and line-count stats for ``file_name``.

    :param file_name: path of the file to inspect.
    :param notfile: when true, ``file_name`` is not inspected at all and
        empty stats are returned.
    :returns: a dict with the keys ``language``, ``dependencies`` and
        ``lines``.
    """
    if notfile:
        return {'language': None, 'dependencies': [], 'lines': None}

    language, lexer = guess_language(file_name)
    dependencies = DependencyParser(file_name, lexer).parse()
    return {
        'language': language,
        'dependencies': dependencies,
        'lines': number_lines_in_file(file_name),
    }