from collections import defaultdict
from functools import partial
import inspect
import logging
from os import makedirs
from os.path import join, abspath, exists
from appdirs import user_data_dir
from coala_utils.decorators import (enforce_signature, classproperty,
get_public_members)
import requests
from coalib.results.Result import Result
from coalib.settings.ConfigurationGathering import get_config_directory
from coalib.settings.FunctionMetadata import FunctionMetadata
from coalib.settings.Section import Section
[docs]class Bear:
"""
A bear contains the actual subroutine that is responsible for checking
source code for certain specifications. However, it can actually do
whatever it wants with the files it gets.
This is the base class for every bear. If you want to write a bear, you
will probably want to look at the ``ProjectBear`` and ``FileBear`` classes
that inherit from this class.
To indicate which languages your bear supports, just give it the
``LANGUAGES`` value which should be a set of string(s):
>>> class SomeBear(Bear):
... LANGUAGES = {'C', 'CPP', 'C#', 'D'}
To indicate the requirements of the bear, assign ``REQUIREMENTS`` a set
with instances of ``PackageRequirements``.
>>> from dependency_management.requirements.PackageRequirement import (
... PackageRequirement)
>>> class SomeBear(Bear):
... REQUIREMENTS = {
... PackageRequirement('pip', 'coala_decorators', '0.2.1')}
If your bear uses requirements from a manager we have a subclass from,
you can use the subclass, such as ``PipRequirement``, without specifying
manager:
>>> from dependency_management.requirements.PipRequirement import (
... PipRequirement)
>>> class SomeBear(Bear):
... REQUIREMENTS = {PipRequirement('coala_decorators', '0.2.1')}
To specify additional attributes to your bear, use the following:
>>> class SomeBear(Bear):
... AUTHORS = {'Jon Snow'}
... AUTHORS_EMAILS = {'jon_snow@gmail.com'}
... MAINTAINERS = {'Catelyn Stark'}
... MAINTAINERS_EMAILS = {'catelyn_stark@gmail.com'}
... LICENSE = 'AGPL-3.0'
... ASCIINEMA_URL = 'https://asciinema.org/a/80761'
If the maintainers are the same as the authors, they can be omitted:
>>> class SomeBear(Bear):
... AUTHORS = {'Jon Snow'}
... AUTHORS_EMAILS = {'jon_snow@gmail.com'}
>>> SomeBear.maintainers
{'Jon Snow'}
>>> SomeBear.maintainers_emails
{'jon_snow@gmail.com'}
If your bear needs to include local files, then specify it giving strings
containing relative file paths to the INCLUDE_LOCAL_FILES set:
>>> class SomeBear(Bear):
... INCLUDE_LOCAL_FILES = {'checkstyle.jar', 'google_checks.xml'}
To keep track easier of what a bear can do, simply tell it to the
``CAN_FIX`` and the ``CAN_DETECT`` sets. Possible values are:
>>> CAN_DETECT = {'Syntax', 'Formatting', 'Security', 'Complexity',
... 'Smell', 'Unused Code', 'Redundancy', 'Variable Misuse', 'Spelling',
... 'Memory Leak', 'Documentation', 'Duplication', 'Commented Code',
... 'Grammar', 'Missing Import', 'Unreachable Code', 'Undefined Element',
... 'Code Simplification'}
>>> CAN_FIX = {'Syntax', ...}
Specifying something to ``CAN_FIX`` makes it obvious that it can be
detected too, so it may be omitted:
>>> class SomeBear(Bear):
... CAN_DETECT = {'Syntax', 'Security'}
... CAN_FIX = {'Redundancy'}
>>> sorted(SomeBear.can_detect)
['Redundancy', 'Security', 'Syntax']
Every bear has a data directory which is unique to that particular bear:
>>> class SomeBear(Bear): pass
>>> class SomeOtherBear(Bear): pass
>>> SomeBear.data_dir == SomeOtherBear.data_dir
False
A bear can be dependent from other bears. ``BEAR_DEPS`` contains bear
classes that are to be executed before this bear gets executed. The results
of these bears will then be passed inside ``self.dependency_results`` as a
dict. The dict will have the name of the bear as key and a list of its
results as values:
>>> class SomeBear(Bear): pass
>>> class SomeOtherBear(Bear):
... BEAR_DEPS = {SomeBear}
>>> SomeOtherBear.BEAR_DEPS
{<class 'coalib.core.Bear.SomeBear'>}
"""
LANGUAGES = set()
REQUIREMENTS = set()
AUTHORS = set()
AUTHORS_EMAILS = set()
MAINTAINERS = set()
MAINTAINERS_EMAILS = set()
PLATFORMS = {'any'}
LICENSE = ''
INCLUDE_LOCAL_FILES = set()
CAN_DETECT = set()
CAN_FIX = set()
ASCIINEMA_URL = ''
BEAR_DEPS = set()
@classproperty
def name(cls):
"""
:return:
The name of the bear.
"""
return cls.__name__
@classproperty
def can_detect(cls):
"""
:return:
A set that contains everything a bear can detect, including
information from what it can fix too.
"""
return cls.CAN_DETECT | cls.CAN_FIX
@classproperty
def source_location(cls):
"""
Returns the directory this bear is inside.
>>> class SomeBear(Bear): pass
>>> SomeBear.source_location
'...Bear.py'
"""
return inspect.getfile(cls)
@classproperty
def maintainers(cls):
"""
:return:
A set containing ``MAINTAINERS`` if specified, else takes
``AUTHORS`` by default.
"""
return cls.AUTHORS if cls.MAINTAINERS == set() else cls.MAINTAINERS
@classproperty
def maintainers_emails(cls):
"""
:return:
A set containing ``MAINTAINERS_EMAILS`` if specified, else takes
``AUTHORS_EMAILS`` by default.
"""
return (cls.AUTHORS_EMAILS
if cls.MAINTAINERS_EMAILS == set() else
cls.MAINTAINERS_EMAILS)
@enforce_signature
def __init__(self, section: Section, file_dict: dict):
"""
Constructs a new bear.
:param section:
The section object where bear settings are contained.
:param file_dict:
The file-dictionary containing a mapping of filenames to the
according file contents.
:raises RuntimeError:
Raised when bear requirements are not fulfilled.
"""
self.section = section
self.file_dict = file_dict
# Copy the bears specified in Bear.BEAR_DEPS to this instance, so
# runtime modifications are allowed.
self.BEAR_DEPS = set(self.BEAR_DEPS)
self._dependency_results = defaultdict(list)
self.setup_dependencies()
cp = type(self).check_prerequisites()
if cp is not True:
error_string = ('The bear ' + self.name +
' does not fulfill all requirements.')
if cp is not False:
error_string += ' ' + cp
raise RuntimeError(error_string)
@property
def dependency_results(self):
"""
Contains all dependency results.
This variable gets set during bear execution from the core and can be
used from ``analyze``.
Modifications to the returned dictionary while the core is running
leads to undefined behaviour.
>>> section = Section('my-section')
>>> file_dict = {'file1.txt': ['']}
>>> bear = Bear(section, file_dict)
>>> bear.dependency_results
defaultdict(<class 'list'>, {})
>>> dependency_bear = Bear(section, file_dict)
>>> bear.dependency_results[type(dependency_bear)] += [1, 2]
>>> bear.dependency_results
defaultdict(<class 'list'>, {<class 'coalib.core.Bear.Bear'>: [1, 2]})
:return:
A dictionary with bear-types as keys and their results received.
"""
return self._dependency_results
# FIXME Make this a @classproperty.
[docs] @classmethod
def get_non_optional_settings(cls):
"""
This method has to determine which settings are needed by this bear.
The user will be prompted for needed settings that are not available
in the settings file so don't include settings where a default value
would do.
Note: This function also queries settings from bear dependencies in
recursive manner. Though circular dependency chains are a challenge to
achieve, this function would never return on them!
:return: A dictionary of needed settings as keys and a tuple of help
text and annotation as values
"""
non_optional_settings = {}
for dependency in cls.BEAR_DEPS:
non_optional_settings.update(
dependency.get_non_optional_settings())
non_optional_settings.update(cls.get_metadata().non_optional_params)
return non_optional_settings
@classmethod
def __json__(cls):
"""
Override JSON export of ``Bear`` class.
"""
# Those members get duplicated if they aren't excluded because they
# exist also as fields.
excluded_members = {'can_detect', 'maintainers', 'maintainers_emails'}
# json cannot serialize properties, so drop them
data = {
key: value
for key, value in get_public_members(cls).items()
if not isinstance(value, property) and key not in excluded_members}
metadata = cls.get_metadata()
non_optional_params = metadata.non_optional_params
optional_params = metadata.optional_params
data['metadata'] = {
'desc': metadata.desc,
'non_optional_params': {param: non_optional_params[param][0]
for param in non_optional_params},
'optional_params': {param: optional_params[param][0]
for param in optional_params}}
return data
[docs] @staticmethod
def setup_dependencies():
"""
This is a user defined function that can download and set up
dependencies (via download_cached_file or arbitrary other means) in an
OS independent way.
"""
[docs] @classmethod
def check_prerequisites(cls):
"""
Checks whether needed runtime prerequisites of the bear are satisfied.
This function gets executed at construction.
Section value requirements shall be checked inside the ``run`` method.
>>> from dependency_management.requirements.PipRequirement import (
... PipRequirement)
>>> class SomeBear(Bear):
... REQUIREMENTS = {PipRequirement('pip')}
>>> SomeBear.check_prerequisites()
True
>>> class SomeOtherBear(Bear):
... REQUIREMENTS = {PipRequirement('really_bad_package')}
>>> SomeOtherBear.check_prerequisites()
'Following requirements are not installed: really_bad_package (...)'
:return: True if prerequisites are satisfied, else False or a string
that serves a more detailed description of what's missing.
"""
not_installed_requirements = [requirement
for requirement in cls.REQUIREMENTS
if not requirement.is_installed()]
if not_installed_requirements:
return 'Following requirements are not installed: ' + ', '.join(
'{} (installable via `{}`)'.format(
requirement.package,
' '.join(requirement.install_command()))
for requirement in not_installed_requirements)
else:
return True
[docs] def get_config_dir(self):
"""
Gives the directory where the configuration file resides.
:return:
Directory of the config file.
"""
return get_config_directory(self.section)
[docs] @classmethod
def download_cached_file(cls, url, filename):
"""
Downloads the file if needed and caches it for the next time. If a
download happens, the user will be informed.
Take a sane simple bear:
>>> section = Section('my-section')
>>> file_dict = {'file1.txt': ['']}
>>> bear = Bear(section, file_dict)
We can now carelessly query for a neat file that doesn't exist yet:
>>> from os import remove
>>> if exists(join(bear.data_dir, 'a_file')):
... remove(join(bear.data_dir, 'a_file'))
>>> file = bear.download_cached_file('https://github.com/', 'a_file')
If we download it again, it'll be much faster as no download occurs:
>>> newfile = bear.download_cached_file(
... 'https://github.com/', 'a_file')
>>> newfile == file
True
:param url:
The URL to download the file from.
:param filename:
The filename it should get, e.g. "test.txt".
:return:
A full path to the file ready for you to use!
"""
filename = join(cls.data_dir, filename)
if exists(filename):
return filename
logging.info('{}: Downloading {} into {!r}.'
.format(cls.name, url, filename))
response = requests.get(url, stream=True, timeout=20)
response.raise_for_status()
with open(filename, 'wb') as file:
for chunk in response.iter_content(125):
file.write(chunk)
return filename
@classproperty
def data_dir(cls):
"""
Returns a directory that may be used by the bear to store stuff. Every
bear has an own directory dependent on their name.
"""
data_dir = abspath(join(user_data_dir('coala-bears'), cls.name))
makedirs(data_dir, exist_ok=True)
return data_dir
@property
def new_result(self):
"""
Returns a partial for creating a result with this bear already bound.
"""
return partial(Result.from_values, self)
[docs] def execute_task(self, args, kwargs):
"""
Executes a task.
By default returns a list of results collected from this bear.
This function has to return something that is picklable to make bears
work in multi-process environments.
:param args:
The arguments of a task.
:param kwargs:
The keyword-arguments of a task.
:return:
A list of results from the bear.
"""
return list(self.analyze(*args, **kwargs))
[docs] def analyze(self, *args, **kwargs):
"""
Performs the code analysis.
:return:
An iterable of results.
"""
raise NotImplementedError('This function has to be implemented for a '
'runnable bear.')
[docs] def generate_tasks(self):
"""
This method is responsible for providing the job arguments ``analyze``
gets called with.
:return:
An iterable containing the positional and keyword arguments
organized in pairs: ``(args-tuple, kwargs-dict)``
"""
raise NotImplementedError('This function has to be implemented for a '
'runnable bear.')