2014-12-23 05:12:57 +00:00
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
"""
|
|
|
|
wakatime.languages
|
|
|
|
~~~~~~~~~~~~~~~~~~
|
|
|
|
|
|
|
|
Parse dependencies from a source code file.
|
|
|
|
|
2014-12-23 07:24:48 +00:00
|
|
|
:copyright: (c) 2014 Alan Hamlett.
|
2014-12-23 05:12:57 +00:00
|
|
|
:license: BSD, see LICENSE for more details.
|
|
|
|
"""
|
|
|
|
|
2014-12-23 05:47:24 +00:00
|
|
|
import logging
|
2014-12-24 18:11:00 +00:00
|
|
|
import traceback
|
2014-12-23 05:47:24 +00:00
|
|
|
|
2014-12-25 05:09:15 +00:00
|
|
|
from ..compat import u, open, import_module
|
2014-12-23 05:12:57 +00:00
|
|
|
|
|
|
|
|
2014-12-23 05:47:24 +00:00
|
|
|
# Module-level logger shared by this module, registered under the name 'WakaTime'.
log = logging.getLogger('WakaTime')
|
|
|
|
|
|
|
|
|
2014-12-23 05:12:57 +00:00
|
|
|
class TokenParser(object):
    """The base class for all dependency parsers. To add support for your
    language, inherit from this class and implement the :meth:`parse` method
    to return a list of dependency strings.

    Dependencies are collected on ``self.dependencies`` through
    :meth:`append`; tokens produced by the lexer are cached on
    ``self.tokens``.
    """

    # Class-level fallbacks, kept so that subclasses overriding ``__init__``
    # without calling it still find these names. ``__init__`` rebinds both
    # lists on the instance so that state is never shared between parsers.
    source_file = None
    lexer = None
    dependencies = []
    tokens = []

    def __init__(self, source_file, lexer=None):
        """Remember the file to parse and the lexer used to tokenize it.

        :param source_file: path of the source code file to read.
        :param lexer: object exposing ``get_tokens_unprocessed(text)``; when
            falsy, :meth:`_extract_tokens` yields no tokens.
        """
        self.source_file = source_file
        self.lexer = lexer
        # Fresh lists per instance: appending to the class-level lists would
        # leak dependencies found in one file into every other parser.
        self.dependencies = []
        self.tokens = []

    def parse(self, tokens=None):
        """ Should return a list of dependencies.

        The base implementation only fills ``self.tokens`` (when neither
        ``tokens`` nor ``self.tokens`` holds anything) and then raises,
        because the actual parsing is language specific.

        :param tokens: optional pre-extracted tokens; when truthy, the
            source file is not tokenized again.
        :raises NotImplementedError: always; subclasses must override.
        """
        if not tokens and not self.tokens:
            self.tokens = self._extract_tokens()
        # NotImplementedError is still an ``Exception``, so existing
        # ``except Exception`` handlers keep working.
        raise NotImplementedError('Not yet implemented.')

    def append(self, dep, truncate=False, separator=None, truncate_to=None,
               strip_whitespace=True):
        """Record ``dep`` as a dependency.

        Thin public wrapper that forwards every argument unchanged to
        :meth:`_save_dependency`; see there for their meaning.
        """
        self._save_dependency(
            dep,
            truncate=truncate,
            truncate_to=truncate_to,
            separator=separator,
            strip_whitespace=strip_whitespace,
        )

    def _extract_tokens(self):
        """Tokenize the start of the source file with the configured lexer.

        At most ``read(512000)`` worth of the file is handed to the lexer.

        :returns: whatever ``lexer.get_tokens_unprocessed`` returns, or an
            empty list when no lexer is set.
        """
        if self.lexer:
            with open(self.source_file, 'r', encoding='utf-8') as fh:
                return self.lexer.get_tokens_unprocessed(fh.read(512000))
        return []

    def _save_dependency(self, dep, truncate=False, separator=None,
                         truncate_to=None, strip_whitespace=True):
        """Normalize ``dep`` and add it to ``self.dependencies``.

        :param dep: dependency string to store.
        :param truncate: when true, split ``dep`` on ``separator`` and keep
            only the leading segments.
        :param separator: segment separator used when truncating; defaults
            to ``'.'``.
        :param truncate_to: number of leading segments to keep. When it is
            ``None``, negative, or larger than ``segments - 1``, all but the
            last segment are kept (``'a.b.c'`` becomes ``'a.b'``). A value
            with a single segment is kept whole.
        :param strip_whitespace: strip surrounding whitespace before storing.

        Values that end up empty are not stored.
        """
        if truncate:
            if separator is None:
                separator = u('.')
            separator = u(separator)
            dep = dep.split(separator)
            if truncate_to is None or truncate_to < 0 or truncate_to > len(dep) - 1:
                # Default / out-of-range: drop only the final segment.
                truncate_to = len(dep) - 1
            dep = dep[0] if len(dep) == 1 else separator.join(dep[0:truncate_to])
        if strip_whitespace:
            dep = dep.strip()
        if dep:
            self.dependencies.append(dep)
|
|
|
|
|
|
|
|
|
|
|
|
class DependencyParser(object):
    """Select the language-specific parser matching a lexer and run it.

    The parser class is looked up in the sibling module whose name is the
    last dotted component of the lexer's module, under the lexer's class
    name with the first ``Lexer`` replaced by ``Parser``. Without a lexer,
    ``UnknownParser`` from the ``unknown`` module is used.
    """

    source_file = None
    lexer = None
    parser = None

    def __init__(self, source_file, lexer):
        """Resolve the parser class for ``lexer``.

        A missing module or class is logged at debug level and leaves
        ``self.parser`` unset, so :meth:`parse` then returns no dependencies.

        :param source_file: path handed on to the parser class.
        :param lexer: lexer instance used to pick the parser, or a falsy
            value to fall back to the unknown parser.
        """
        self.source_file = source_file
        self.lexer = lexer

        # Start from the fallback names and override them when a lexer exists.
        module_name, class_name = 'unknown', 'UnknownParser'
        if self.lexer:
            module_name = self.lexer.__module__.rpartition('.')[2]
            lexer_class_name = self.lexer.__class__.__name__
            class_name = lexer_class_name.replace('Lexer', 'Parser', 1)

        relative_name = '.%s' % module_name
        try:
            module = import_module(relative_name, package=__package__)
            try:
                self.parser = getattr(module, class_name)
            except AttributeError:
                message = 'Module {0} is missing class {1}'.format(module.__name__, class_name)
                log.debug(message)
        except ImportError:
            log.debug(traceback.format_exc())

    def parse(self):
        """Run the resolved parser and return its dependencies de-duplicated.

        :returns: a list of unique dependencies, or an empty list when no
            parser class was resolved.
        """
        if not self.parser:
            return []
        plugin = self.parser(self.source_file, lexer=self.lexer)
        found = plugin.parse()
        return list(set(found))
|