Don't truncate dependencies by default; improve the Python dependency parser.
This commit is contained in:
parent
40c8067dbf
commit
24d066c572
6 changed files with 55 additions and 40 deletions
|
@ -12,7 +12,7 @@
|
||||||
import logging
|
import logging
|
||||||
import traceback
|
import traceback
|
||||||
|
|
||||||
from ..compat import open, import_module
|
from ..compat import u, open, import_module
|
||||||
|
|
||||||
|
|
||||||
log = logging.getLogger('WakaTime')
|
log = logging.getLogger('WakaTime')
|
||||||
|
@ -39,8 +39,17 @@ class TokenParser(object):
|
||||||
self.tokens = self._extract_tokens()
|
self.tokens = self._extract_tokens()
|
||||||
raise Exception('Not yet implemented.')
|
raise Exception('Not yet implemented.')
|
||||||
|
|
||||||
def append(self, dep, truncate=True):
|
def append(self, dep, truncate=False, separator=None, truncate_to=None,
|
||||||
self._save_dependency(dep, truncate=truncate)
|
strip_whitespace=True):
|
||||||
|
if dep == 'as':
|
||||||
|
print('***************** as')
|
||||||
|
self._save_dependency(
|
||||||
|
dep,
|
||||||
|
truncate=truncate,
|
||||||
|
truncate_to=truncate_to,
|
||||||
|
separator=separator,
|
||||||
|
strip_whitespace=strip_whitespace,
|
||||||
|
)
|
||||||
|
|
||||||
def _extract_tokens(self):
|
def _extract_tokens(self):
|
||||||
if self.lexer:
|
if self.lexer:
|
||||||
|
@ -48,8 +57,18 @@ class TokenParser(object):
|
||||||
return self.lexer.get_tokens_unprocessed(fh.read(512000))
|
return self.lexer.get_tokens_unprocessed(fh.read(512000))
|
||||||
return []
|
return []
|
||||||
|
|
||||||
def _save_dependency(self, dep, truncate=True):
|
def _save_dependency(self, dep, truncate=False, separator=None,
|
||||||
dep = dep.strip().split('.')[0].strip() if truncate else dep.strip()
|
truncate_to=None, strip_whitespace=True):
|
||||||
|
if truncate:
|
||||||
|
if separator is None:
|
||||||
|
separator = u('.')
|
||||||
|
separator = u(separator)
|
||||||
|
dep = dep.split(separator)
|
||||||
|
if truncate_to is None or truncate_to < 0 or truncate_to > len(dep) - 1:
|
||||||
|
truncate_to = len(dep) - 1
|
||||||
|
dep = dep[0] if len(dep) == 1 else separator.join(dep[0:truncate_to])
|
||||||
|
if strip_whitespace:
|
||||||
|
dep = dep.strip()
|
||||||
if dep:
|
if dep:
|
||||||
self.dependencies.append(dep)
|
self.dependencies.append(dep)
|
||||||
|
|
||||||
|
|
|
@ -31,7 +31,7 @@ class CppParser(TokenParser):
|
||||||
def _process_preproc(self, token, content):
|
def _process_preproc(self, token, content):
|
||||||
if content.strip().startswith('include ') or content.strip().startswith("include\t"):
|
if content.strip().startswith('include ') or content.strip().startswith("include\t"):
|
||||||
content = content.replace('include', '', 1).strip()
|
content = content.replace('include', '', 1).strip()
|
||||||
self.append(content, truncate=False)
|
self.append(content)
|
||||||
|
|
||||||
def _process_other(self, token, content):
|
def _process_other(self, token, content):
|
||||||
pass
|
pass
|
||||||
|
|
|
@ -30,9 +30,7 @@ class CSharpParser(TokenParser):
|
||||||
|
|
||||||
def _process_namespace(self, token, content):
|
def _process_namespace(self, token, content):
|
||||||
if content != 'import' and content != 'package' and content != 'namespace':
|
if content != 'import' and content != 'package' and content != 'namespace':
|
||||||
content = content.split('.')
|
self.append(content, truncate=True)
|
||||||
content = content[0] if len(content) == 1 else '.'.join(content[0:len(content)-1])
|
|
||||||
self.append(content, truncate=False)
|
|
||||||
|
|
||||||
def _process_other(self, token, content):
|
def _process_other(self, token, content):
|
||||||
pass
|
pass
|
||||||
|
|
|
@ -30,9 +30,7 @@ class JavaParser(TokenParser):
|
||||||
|
|
||||||
def _process_namespace(self, token, content):
|
def _process_namespace(self, token, content):
|
||||||
if content != 'import' and content != 'package' and content != 'namespace':
|
if content != 'import' and content != 'package' and content != 'namespace':
|
||||||
content = content.split('.')
|
self.append(content, truncate=True)
|
||||||
content = content[0] if len(content) == 1 else '.'.join(content[0:len(content)-1])
|
|
||||||
self.append(content, truncate=False)
|
|
||||||
|
|
||||||
def _process_other(self, token, content):
|
def _process_other(self, token, content):
|
||||||
pass
|
pass
|
||||||
|
|
|
@ -42,15 +42,11 @@ class PhpParser(TokenParser):
|
||||||
|
|
||||||
def _process_name(self, token, content):
|
def _process_name(self, token, content):
|
||||||
if self.state == 'use':
|
if self.state == 'use':
|
||||||
content = content.split("\\")
|
self.append(content, truncate=True, separator=u("\\"))
|
||||||
content = content[0] if len(content) == 1 else "\\".join(content[0:len(content)-1])
|
|
||||||
self.append(content, truncate=False)
|
|
||||||
|
|
||||||
def _process_function(self, token, content):
|
def _process_function(self, token, content):
|
||||||
if self.state == 'use function':
|
if self.state == 'use function':
|
||||||
content = content.split("\\")
|
self.append(content, truncate=True, separator=u("\\"))
|
||||||
content = content[0] if len(content) == 1 else "\\".join(content[0:len(content)-1])
|
|
||||||
self.append(content, truncate=False)
|
|
||||||
self.state = 'use'
|
self.state = 'use'
|
||||||
|
|
||||||
def _process_keyword(self, token, content):
|
def _process_keyword(self, token, content):
|
||||||
|
@ -71,7 +67,7 @@ class PhpParser(TokenParser):
|
||||||
content = content.strip()
|
content = content.strip()
|
||||||
if u(token) == 'Token.Literal.String.Double':
|
if u(token) == 'Token.Literal.String.Double':
|
||||||
content = u('"{0}"').format(content)
|
content = u('"{0}"').format(content)
|
||||||
self.append(content, truncate=False)
|
self.append(content)
|
||||||
self.state = None
|
self.state = None
|
||||||
|
|
||||||
def _process_punctuation(self, token, content):
|
def _process_punctuation(self, token, content):
|
||||||
|
|
|
@ -44,6 +44,9 @@ class PythonParser(TokenParser):
|
||||||
def _process_namespace(self, token, content):
|
def _process_namespace(self, token, content):
|
||||||
if self.state is None:
|
if self.state is None:
|
||||||
self.state = content
|
self.state = content
|
||||||
|
else:
|
||||||
|
if content == 'as':
|
||||||
|
self.nonpackage = True
|
||||||
else:
|
else:
|
||||||
self._process_import(token, content)
|
self._process_import(token, content)
|
||||||
|
|
||||||
|
@ -53,13 +56,13 @@ class PythonParser(TokenParser):
|
||||||
self.nonpackage = False
|
self.nonpackage = False
|
||||||
else:
|
else:
|
||||||
if self.state == 'from':
|
if self.state == 'from':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
if self.state == 'from-2' and content != 'import':
|
if self.state == 'from-2' and content != 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
elif self.state == 'import':
|
elif self.state == 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
elif self.state == 'import-2':
|
elif self.state == 'import-2':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
else:
|
else:
|
||||||
self.state = None
|
self.state = None
|
||||||
|
|
||||||
|
@ -69,13 +72,13 @@ class PythonParser(TokenParser):
|
||||||
self.nonpackage = False
|
self.nonpackage = False
|
||||||
else:
|
else:
|
||||||
if self.state == 'from':
|
if self.state == 'from':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
if self.state == 'from-2' and content != 'import':
|
if self.state == 'from-2' and content != 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
elif self.state == 'import':
|
elif self.state == 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
elif self.state == 'import-2':
|
elif self.state == 'import-2':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
else:
|
else:
|
||||||
self.state = None
|
self.state = None
|
||||||
|
|
||||||
|
@ -101,16 +104,17 @@ class PythonParser(TokenParser):
|
||||||
pass
|
pass
|
||||||
|
|
||||||
def _process_import(self, token, content):
|
def _process_import(self, token, content):
|
||||||
self.nonpackage = False
|
if not self.nonpackage:
|
||||||
if self.state == 'from':
|
if self.state == 'from':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
self.state = 'from-2'
|
self.state = 'from-2'
|
||||||
elif self.state == 'from-2' and content != 'import':
|
elif self.state == 'from-2' and content != 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
elif self.state == 'import':
|
elif self.state == 'import':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
self.state = 'import-2'
|
self.state = 'import-2'
|
||||||
elif self.state == 'import-2':
|
elif self.state == 'import-2':
|
||||||
self.append(content)
|
self.append(content, truncate=True, truncate_to=0)
|
||||||
else:
|
else:
|
||||||
self.state = None
|
self.state = None
|
||||||
|
self.nonpackage = False
|
||||||
|
|
Loading…
Reference in a new issue