try opening files with filesystem encoding when opening with utf-8 causes UnicodeDecodeError
This commit is contained in:
parent
31a353be7a
commit
43c461a7cc
6 changed files with 50 additions and 10 deletions
|
@ -10,6 +10,7 @@
|
||||||
"""
|
"""
|
||||||
|
|
||||||
import logging
|
import logging
|
||||||
|
import sys
|
||||||
import traceback
|
import traceback
|
||||||
|
|
||||||
from ..compat import u, open, import_module
|
from ..compat import u, open, import_module
|
||||||
|
@ -53,8 +54,16 @@ class TokenParser(object):
|
||||||
|
|
||||||
def _extract_tokens(self):
|
def _extract_tokens(self):
|
||||||
if self.lexer:
|
if self.lexer:
|
||||||
|
try:
|
||||||
with open(self.source_file, 'r', encoding='utf-8') as fh:
|
with open(self.source_file, 'r', encoding='utf-8') as fh:
|
||||||
return self.lexer.get_tokens_unprocessed(fh.read(512000))
|
return self.lexer.get_tokens_unprocessed(fh.read(512000))
|
||||||
|
except:
|
||||||
|
pass
|
||||||
|
try:
|
||||||
|
with open(self.source_file, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
return self.lexer.get_tokens_unprocessed(fh.read(512000))
|
||||||
|
except:
|
||||||
|
pass
|
||||||
return []
|
return []
|
||||||
|
|
||||||
def _save_dependency(self, dep, truncate=False, separator=None,
|
def _save_dependency(self, dep, truncate=False, separator=None,
|
||||||
|
|
|
@ -11,6 +11,7 @@
|
||||||
|
|
||||||
import logging
|
import logging
|
||||||
import os
|
import os
|
||||||
|
import sys
|
||||||
|
|
||||||
from .base import BaseProject
|
from .base import BaseProject
|
||||||
from ..compat import u, open
|
from ..compat import u, open
|
||||||
|
@ -38,8 +39,14 @@ class Git(BaseProject):
|
||||||
try:
|
try:
|
||||||
with open(head, 'r', encoding='utf-8') as fh:
|
with open(head, 'r', encoding='utf-8') as fh:
|
||||||
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
||||||
|
except UnicodeDecodeError:
|
||||||
|
try:
|
||||||
|
with open(head, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
||||||
|
except:
|
||||||
|
log.exception("Exception:")
|
||||||
except IOError:
|
except IOError:
|
||||||
pass
|
log.exception("Exception:")
|
||||||
return None
|
return None
|
||||||
|
|
||||||
def _project_base(self):
|
def _project_base(self):
|
||||||
|
|
|
@ -11,6 +11,7 @@
|
||||||
|
|
||||||
import logging
|
import logging
|
||||||
import os
|
import os
|
||||||
|
import sys
|
||||||
|
|
||||||
from .base import BaseProject
|
from .base import BaseProject
|
||||||
from ..compat import u, open
|
from ..compat import u, open
|
||||||
|
@ -36,8 +37,14 @@ class Mercurial(BaseProject):
|
||||||
try:
|
try:
|
||||||
with open(branch_file, 'r', encoding='utf-8') as fh:
|
with open(branch_file, 'r', encoding='utf-8') as fh:
|
||||||
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
||||||
|
except UnicodeDecodeError:
|
||||||
|
try:
|
||||||
|
with open(branch_file, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
return u(fh.readline().strip().rsplit('/', 1)[-1])
|
||||||
|
except:
|
||||||
|
log.exception("Exception:")
|
||||||
except IOError:
|
except IOError:
|
||||||
pass
|
log.exception("Exception:")
|
||||||
return u('default')
|
return u('default')
|
||||||
|
|
||||||
def _find_hg_config_dir(self, path):
|
def _find_hg_config_dir(self, path):
|
||||||
|
|
|
@ -46,8 +46,8 @@ class Subversion(BaseProject):
|
||||||
'/usr/local/bin/svn',
|
'/usr/local/bin/svn',
|
||||||
]
|
]
|
||||||
for location in locations:
|
for location in locations:
|
||||||
with open(os.devnull, 'wb') as DEVNULL:
|
|
||||||
try:
|
try:
|
||||||
|
with open(os.devnull, 'wb') as DEVNULL:
|
||||||
Popen([location, '--version'], stdout=DEVNULL, stderr=DEVNULL)
|
Popen([location, '--version'], stdout=DEVNULL, stderr=DEVNULL)
|
||||||
self.binary_location = location
|
self.binary_location = location
|
||||||
return location
|
return location
|
||||||
|
|
|
@ -13,6 +13,7 @@
|
||||||
|
|
||||||
import logging
|
import logging
|
||||||
import os
|
import os
|
||||||
|
import sys
|
||||||
|
|
||||||
from .base import BaseProject
|
from .base import BaseProject
|
||||||
from ..compat import u, open
|
from ..compat import u, open
|
||||||
|
@ -34,6 +35,13 @@ class WakaTimeProjectFile(BaseProject):
|
||||||
with open(self.config, 'r', encoding='utf-8') as fh:
|
with open(self.config, 'r', encoding='utf-8') as fh:
|
||||||
self._project_name = u(fh.readline().strip())
|
self._project_name = u(fh.readline().strip())
|
||||||
self._project_branch = u(fh.readline().strip())
|
self._project_branch = u(fh.readline().strip())
|
||||||
|
except UnicodeDecodeError:
|
||||||
|
try:
|
||||||
|
with open(self.config, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
self._project_name = u(fh.readline().strip())
|
||||||
|
self._project_branch = u(fh.readline().strip())
|
||||||
|
except:
|
||||||
|
log.exception("Exception:")
|
||||||
except IOError:
|
except IOError:
|
||||||
log.exception("Exception:")
|
log.exception("Exception:")
|
||||||
|
|
||||||
|
|
|
@ -143,6 +143,11 @@ def number_lines_in_file(file_name):
|
||||||
with open(file_name, 'r', encoding='utf-8') as fh:
|
with open(file_name, 'r', encoding='utf-8') as fh:
|
||||||
for line in fh:
|
for line in fh:
|
||||||
lines += 1
|
lines += 1
|
||||||
|
except:
|
||||||
|
try:
|
||||||
|
with open(file_name, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
for line in fh:
|
||||||
|
lines += 1
|
||||||
except:
|
except:
|
||||||
return None
|
return None
|
||||||
return lines
|
return lines
|
||||||
|
@ -180,5 +185,9 @@ def get_file_contents(file_name):
|
||||||
with open(file_name, 'r', encoding='utf-8') as fh:
|
with open(file_name, 'r', encoding='utf-8') as fh:
|
||||||
text = fh.read(512000)
|
text = fh.read(512000)
|
||||||
except:
|
except:
|
||||||
pass
|
try:
|
||||||
|
with open(file_name, 'r', encoding=sys.getfilesystemencoding()) as fh:
|
||||||
|
text = fh.read(512000)
|
||||||
|
except:
|
||||||
|
log.exception("Exception:")
|
||||||
return text
|
return text
|
||||||
|
|
Loading…
Reference in a new issue