Source code for aiida.orm.implementation.general.computer

# -*- coding: utf-8 -*-
###########################################################################
# Copyright (c), The AiiDA team. All rights reserved.                     #
# This file is part of the AiiDA code.                                    #
#                                                                         #
# The code is hosted on GitHub at https://github.com/aiidateam/aiida_core #
# For further information on the license, see the LICENSE.txt file        #
# For further information please visit http://www.aiida.net               #
###########################################################################
from abc import ABCMeta, abstractmethod, abstractproperty

import logging
import os

from aiida.transport import Transport, TransportFactory
from aiida.scheduler import Scheduler, SchedulerFactory

from aiida.common.exceptions import (
    ConfigurationError, DbContentError,
    MissingPluginError, ValidationError)

from aiida.common.utils import classproperty
from aiida.common.utils import abstractclassmethod, abstractstaticmethod


[docs]class AbstractComputer(object):
    """
    Base class to map a node in the DB + its permanent repository counterpart.

    Stores attributes starting with an underscore.

    Caches files and attributes before the first save, and saves everything only on store().
    After the call to store(), attributes cannot be changed.

    Only after storing (or upon loading from uuid) metadata can be modified
    and in this case they are directly set on the db.

    In the plugin, also set the _plugin_type_string, to be set in the DB in the 'type' field.
    """
    _logger = logging.getLogger(__name__)

    @classproperty
    def _conf_attributes(self):
        """
        Return the configuration attributes to be used in the 'setup' phase.

        The return value is a list of tuples. Each tuple has three elements:
        1. an internal name (used to find the
           _set_internalname_string, and get_internalname_string methods)
        2. a short human-readable name
        3. A long human-readable description
        4. True if it is a multi-line input, False otherwise

        For the implementation, see in aiida.cmdline.computer

        .. note: you can define a ``_shouldcall_internalname`` method that returns
          either True or False if the specific configuration option has to be
          called or not. If such a method is not found, the option is always
          asked to the user. In this case, you typically also want to define a
          ``_cleanup_internalname`` method to remove any previous configuration
          associated to internalname, in case ``_shouldcall_internalname``
          returns False.

        .. note: IMPORTANT! For each entry, remember to define the
          ``_set_internalname_string`` and ``get_internalname_string`` methods.
          Moreover, the ``_set_internalname_string`` method should also
          immediately validate the value.

        ..note: Defining it as a property increases the overall execution
          of the code because it does not require to calculate
          Transport.get_valid_transports() at each load of this class.
        """

        return [
            ("hostname",
             "Fully-qualified hostname",
             "The fully qualified host-name of this computer",
             False,
             ),
            ("description",
             "Description",
             "A human-readable description of this computer",
             False,
             ),
            ("enabled_state",
             "Enabled",
             "True or False; if False, the computer is disabled and calculations\n"
             "associated with it will not be submitted",
             False,
             ),
            ("transport_type",
             "Transport type",
             "The name of the transport to be used. Valid names are: {}".format(
                 ",".join(Transport.get_valid_transports())),
             False,
             ),
            ("scheduler_type",
             "Scheduler type",
             "The name of the scheduler to be used. Valid names are: {}".format(
                 ",".join(Scheduler.get_valid_schedulers())),
             False,
             ),
            ("shebang",
             "shebang line at the beginning of the submission script",
             "this line specifies the first line of the submission script for this computer",
             False,
             ),
            ("workdir",
             "AiiDA work directory",
             "The absolute path of the directory on the computer where AiiDA will\n"
             "run the calculations (typically, the scratch of the computer). You\n"
             "can use the {username} replacement, that will be replaced by your\n"
             "username on the remote computer",
             False,
             ),
            # Must be called after the scheduler!
            ("mpirun_command",
             "mpirun command",
             "The mpirun command needed on the cluster to run parallel MPI\n"
             "programs. You can use the {tot_num_mpiprocs} replacement, that will be \n"
             "replaced by the total number of cpus, or the other scheduler-dependent\n"
             "replacement fields (see the scheduler docs for more information)",
             False,
             ),
            ("default_mpiprocs_per_machine",
             "Default number of CPUs per machine",
             "Enter here the default number of CPUs per machine (node) that \n"
             "should be used if nothing is otherwise specified. Leave empty \n"
             "if you do not want to provide a default value.\n",
             False,
             ),
            ("prepend_text",
             "Text to prepend to each command execution",
             "This is a multiline string, whose content will be prepended inside\n"
             "the submission script before the real execution of the job. It is\n"
             "your responsibility to write proper bash code!",
             True,
             ),
            ("append_text",
             "Text to append to each command execution",
             "This is a multiline string, whose content will be appended inside\n"
             "the submission script after the real execution of the job. It is\n"
             "your responsibility to write proper bash code!",
             True,
             ),
        ]

    def __int__(self):
        """
        Convert the class to an integer. This is needed to allow querying with Django.
        Be careful, though, not to pass it to a wrong field! This only returns the
        local DB principal key value.
        """
        return self.pk

    @abstractproperty
    def uuid(self):
        """
        Return the UUID in the DB.
        """
        pass

    @abstractproperty
    def pk(self):
        """
        Return the principal key in the DB.
        """
        pass

    @abstractproperty
    def id(self):
        """
        Return the principal key in the DB.
        """
        pass

    @abstractmethod
    def __init__(self, **kwargs):
        pass

    @abstractmethod
    def set(self, **kwargs):
        pass

[docs]    @abstractstaticmethod
    def get_db_columns():
        """
        This method returns a list with the column names and types of the
        table
        corresponding to this class.
        :return: a list with the names of the columns
        """
        pass

[docs]    @abstractclassmethod
    def list_names(cls):
        """
        Return a list with all the names of the computers in the DB.
        """
        pass

    @abstractproperty
    def full_text_info(self):
        """
        Return a (multiline) string with a human-readable detailed information
        on this computer.
        """
        pass

    @abstractproperty
    def to_be_stored(self):
        pass

[docs]    @abstractclassmethod
    def get(cls, computer):
        """
        Return a computer from its name (or from another Computer or DbComputer instance)
        """
        pass

    @property
    def logger(self):
        return self._logger

[docs]    @classmethod
    def _name_validator(cls, name):
        """
        Validates the name.
        """
        if not name.strip():
            raise ValidationError("No name specified")

    def _get_hostname_string(self):
        return self.get_hostname()

[docs]    def _set_hostname_string(self, string):
        """
        Set the hostname starting from a string.
        """
        self._hostname_validator(string)
        self.set_hostname(string)

[docs]    @classmethod
    def _hostname_validator(cls, hostname):
        """
        Validates the hostname.
        """
        if not hostname.strip():
            raise ValidationError("No hostname specified")

[docs]    def _get_default_mpiprocs_per_machine_string(self):
        """
        Get the default number of CPUs per machine (node) as a string
        """
        def_cpus_per_machine = self.get_default_mpiprocs_per_machine()
        if def_cpus_per_machine is None:
            return ""
        else:
            return str(def_cpus_per_machine)

[docs]    def _set_default_mpiprocs_per_machine_string(self, string):
        """
        Set the default number of CPUs per machine (node) from a string (set to
        None if the string is empty)
        """
        if not string:
            def_cpus_per_machine = None
        else:
            try:
                def_cpus_per_machine = int(string)
            except ValueError:
                raise ValidationError("Invalid value for default_mpiprocs_per_machine, "
                                      "must be a positive integer, or an empty "
                                      "string if you do not want to provide a "
                                      "default value.")

        self._default_mpiprocs_per_machine_validator(def_cpus_per_machine)

        self.set_default_mpiprocs_per_machine(def_cpus_per_machine)

[docs]    def _default_mpiprocs_per_machine_validator(self, def_cpus_per_machine):
        """
        Validates the default number of CPUs per machine (node)
        """
        if def_cpus_per_machine is None:
            return

        if not isinstance(def_cpus_per_machine, (
                int, long)) or def_cpus_per_machine <= 0:
            raise ValidationError("Invalid value for default_mpiprocs_per_machine, "
                                  "must be a positive integer, or an empty "
                                  "string if you do not want to provide a "
                                  "default value.")

[docs]    def _shouldcall_default_mpiprocs_per_machine(self):
        """
        Return True if the scheduler can accept 'default_mpiprocs_per_machine',
        False otherwise.

        If there is a problem in determining the scheduler, return True to
        avoid exceptions.
        """
        try:
            SchedulerClass = SchedulerFactory(self.get_scheduler_type())
        except MissingPluginError:
            # Return True if the Scheduler was not found...
            return True

        JobResourceClass = SchedulerClass._job_resource_class
        if JobResourceClass is None:
            # Odd situation...
            return False

        return JobResourceClass.accepts_default_mpiprocs_per_machine()

[docs]    def _cleanup_default_mpiprocs_per_machine(self):
        """
        Called by the command line utility in case the _shouldcall_ routine
        returns False, to remove possible values that were previously set
        (e.g. if one used before a pbspro scheduler and set the
        default_mpiprocs_per_machine, and then switches to sge, the question is
        not asked, but the value should also be removed from the DB.
        """
        self.set_default_mpiprocs_per_machine(None)

    def _get_enabled_state_string(self):
        return "True" if self.is_enabled() else "False"

[docs]    def _set_enabled_state_string(self, string):
        """
        Set the enabled state starting from a string.
        """
        upper_string = string.upper()
        if upper_string in ['YES', 'Y', 'T', 'TRUE']:
            enabled_state = True
        elif upper_string in ['NO', 'N', 'F', 'FALSE']:
            enabled_state = False
        else:
            raise ValidationError("Invalid value '{}' for the enabled state, must "
                                  "be a boolean".format(string))

        self._enabled_state_validator(enabled_state)

        self.set_enabled_state(enabled_state)

[docs]    @classmethod
    def _enabled_state_validator(cls, enabled_state):
        """
        Validates the hostname.
        """
        if not isinstance(enabled_state, bool):
            raise ValidationError("Invalid value '{}' for the enabled state, must "
                                  "be a boolean".format(str(enabled_state)))

    def _get_description_string(self):
        return self.get_description()

[docs]    def _set_description_string(self, string):
        """
        Set the description starting from a string.
        """
        self._description_validator(string)
        self.set_description(string)

[docs]    @classmethod
    def _description_validator(cls, description):
        """
        Validates the description.
        """
        # The description is always valid
        pass

    def _get_transport_type_string(self):
        return self.get_transport_type()

[docs]    def _set_transport_type_string(self, string):
        """
        Set the transport_type starting from a string.
        """
        self._transport_type_validator(string)
        self.set_transport_type(string)

[docs]    @classmethod
    def _transport_type_validator(cls, transport_type):
        """
        Validates the transport string.
        """
        if transport_type not in Transport.get_valid_transports():
            raise ValidationError("The specified transport is not a valid one")

    def _get_scheduler_type_string(self):
        return self.get_scheduler_type()

[docs]    def _set_scheduler_type_string(self, string):
        """
        Set the scheduler_type starting from a string.
        """
        self._scheduler_type_validator(string)
        self.set_scheduler_type(string)

[docs]    @classmethod
    def _scheduler_type_validator(cls, scheduler_type):
        """
        Validates the transport string.
        """
        if scheduler_type not in Scheduler.get_valid_schedulers():
            raise ValidationError("The specified scheduler is not a valid one")

    def _get_prepend_text_string(self):
        return self.get_prepend_text()

[docs]    def _set_prepend_text_string(self, string):
        """
        Set the prepend_text starting from a string.
        """
        self._prepend_text_validator(string)
        self.set_prepend_text(string)

[docs]    @classmethod
    def _prepend_text_validator(cls, prepend_text):
        """
        Validates the prepend text string.
        """
        # no validation done
        pass

    def _get_append_text_string(self):
        return self.get_append_text()

[docs]    def _set_append_text_string(self, string):
        """
        Set the append_text starting from a string.
        """
        self._append_text_validator(string)
        self.set_append_text(string)

[docs]    @classmethod
    def _append_text_validator(cls, append_text):
        """
        Validates the append text string.
        """
        # no validation done
        pass

    def _get_workdir_string(self):
        return self.get_workdir()

[docs]    def _set_workdir_string(self, string):
        """
        Set the workdir starting from a string.
        """
        self._workdir_validator(string)
        self.set_workdir(string)


    def _get_shebang_string(self):
        return self.get_shebang()

[docs]    def _set_shebang_string(self, string):
        """
        Set the shebang line.
        """
        # self._shebang_validator(string)
        # Should we validate?
        self.set_shebang(string)

[docs]    @classmethod
    def _workdir_validator(cls, workdir):
        """
        Validates the transport string.
        """
        if not workdir.strip():
            raise ValidationError("No workdir specified")

        try:
            convertedwd = workdir.format(username="test")
        except KeyError as e:
            raise ValidationError("In workdir there is an unknown replacement "
                                  "field '{}'".format(e.message))
        except ValueError as e:
            raise ValidationError("Error in the string: '{}'".format(e.message))

        if not os.path.isabs(convertedwd):
            raise ValidationError("The workdir must be an absolute path")

    def _get_mpirun_command_string(self):
        return " ".join(self.get_mpirun_command())

[docs]    def _set_mpirun_command_string(self, string):
        """
        Set the mpirun command string (from a string to a list).
        """
        converted_cmd = str(string).strip().split(" ")
        if converted_cmd == ['']:
            converted_cmd = []
        self._mpirun_command_validator(converted_cmd)
        self.set_mpirun_command(converted_cmd)

[docs]    def _mpirun_command_validator(self, mpirun_cmd):
        """
        Validates the mpirun_command variable. MUST be called after properly
        checking for a valid scheduler.
        """
        if not isinstance(mpirun_cmd, (tuple, list)) or not (
                all(isinstance(i, basestring) for i in mpirun_cmd)):
            raise ValidationError("the mpirun_command must be a list of strings")

        try:
            job_resource_keys = self.get_scheduler()._job_resource_class.get_valid_keys()
        except MissingPluginError:
            raise ValidationError("Unable to load the scheduler for this computer")

        subst = {i: 'value' for i in job_resource_keys}
        subst['tot_num_mpiprocs'] = 'value'

        try:
            for arg in mpirun_cmd:
                arg.format(**subst)
        except KeyError as e:
            raise ValidationError("In workdir there is an unknown replacement "
                                  "field '{}'".format(e.message))
        except ValueError as e:
            raise ValidationError("Error in the string: '{}'".format(e.message))

[docs]    def validate(self):
        """
        Check if the attributes and files retrieved from the DB are valid.
        Raise a ValidationError if something is wrong.

        Must be able to work even before storing: therefore, use the get_attr and similar methods
        that automatically read either from the DB or from the internal attribute cache.

        For the base class, this is always valid. Subclasses will reimplement this.
        In the subclass, always call the super().validate() method first!
        """
        if not self.get_name().strip():
            raise ValidationError("No name specified")

        self._hostname_validator(self.get_hostname())

        self._description_validator(self.get_description())

        self._enabled_state_validator(self.is_enabled())

        self._transport_type_validator(self.get_transport_type())

        self._scheduler_type_validator(self.get_scheduler_type())

        self._workdir_validator(self.get_workdir())

        try:
            mpirun_cmd = self.get_mpirun_command()
        except DbContentError:
            raise ValidationError("Error in the DB content of the transport_params")

        # To be called AFTER the validation of the scheduler
        self._mpirun_command_validator(mpirun_cmd)

[docs]    @abstractmethod
    def copy(self):
        """
        Return a copy of the current object to work with, not stored yet.
        """
        pass

    @abstractproperty
    def dbcomputer(self):
        pass

[docs]    @abstractmethod
    def store(self):
        """
        Store the computer in the DB.

        Differently from Nodes, a computer can be re-stored if its properties
        are to be changed (e.g. a new mpirun command, etc.)
        """
        pass

    @abstractproperty
    def name(self):
        pass

    @abstractproperty
    def description(self):
        pass

    @abstractproperty
    def hostname(self):
        pass

    @abstractmethod
    def _get_metadata(self):
        pass

[docs]    @abstractmethod
    def _set_metadata(self, metadata_dict):
        """
        Set the metadata.

        .. note: You still need to call the .store() method to actually save
           data to the database! (The store method can be called multiple
           times, differently from AiiDA Node objects).
        """
        pass

    def _del_property(self, k, raise_exception=True):
        olddata = self._get_metadata()
        try:
            del olddata[k]
        except KeyError:
            if raise_exception:
                raise AttributeError("'{}' property not found".format(k))
            else:
                # Do not reset the metadata, it is not necessary
                return
        self._set_metadata(olddata)

    def _set_property(self, k, v):
        olddata = self._get_metadata()
        olddata[k] = v
        self._set_metadata(olddata)

    def _get_property(self, k, *args):
        if len(args) > 1:
            raise TypeError("_get_property expected at most 2 arguments")
        olddata = self._get_metadata()
        try:
            return olddata[k]
        except KeyError:
            if len(args) == 0:
                raise AttributeError("'{}' property not found".format(k))
            elif len(args) == 1:
                return args[0]

    def get_prepend_text(self):
        return self._get_property("prepend_text", "")

    def set_prepend_text(self, val):
        self._set_property("prepend_text", unicode(val))

    def get_append_text(self):
        return self._get_property("append_text", "")

    def set_append_text(self, val):
        self._set_property("append_text", unicode(val))

[docs]    def get_mpirun_command(self):
        """
        Return the mpirun command. Must be a list of strings, that will be
        then joined with spaces when submitting.

        I also provide a sensible default that may be ok in many cases.
        """
        return self._get_property("mpirun_command",
                                  ["mpirun", "-np", "{tot_num_mpiprocs}"])

[docs]    def set_mpirun_command(self, val):
        """
        Set the mpirun command. It must be a list of strings (you can use
        string.split() if you have a single, space-separated string).
        """
        if not isinstance(val, (tuple, list)) or not (
                all(isinstance(i, basestring) for i in val)):
            raise TypeError("the mpirun_command must be a list of strings")
        self._set_property("mpirun_command", val)

[docs]    def get_default_mpiprocs_per_machine(self):
        """
        Return the default number of CPUs per machine (node) for this computer,
        or None if it was not set.
        """
        return self._get_property("default_mpiprocs_per_machine",
                                  None)

[docs]    def set_default_mpiprocs_per_machine(self, def_cpus_per_machine):
        """
        Set the default number of CPUs per machine (node) for this computer.
        Accepts None if you do not want to set this value.
        """
        if def_cpus_per_machine is None:
            self._del_property("default_mpiprocs_per_machine", raise_exception=False)
        else:
            if not isinstance(def_cpus_per_machine, (int, long)):
                raise TypeError("def_cpus_per_machine must be an integer (or None)")
        self._set_property("default_mpiprocs_per_machine", def_cpus_per_machine)

    @abstractmethod
    def get_transport_params(self):
        pass

    @abstractmethod
    def set_transport_params(self, val):
        pass

    @abstractmethod
    def get_workdir(self):
        pass

    @abstractmethod
    def get_shebang(self):
        pass

    @abstractmethod
    def set_workdir(self, val):
        pass

[docs]    def set_shebang(self, val):
        """
        :param str val: A valid shebang line
        """
        if not isinstance(val, basestring):
            raise ValueError("{} is invalid. Input has to be a string".format(val))
        if not val.startswith('#!'):
            raise ValueError("{} is invalid. A shebang line has to start with #!".format(val))
        metadata = self._get_metadata()
        metadata['shebang'] = val
        self._set_metadata(metadata)

    @abstractmethod
    def get_name(self):
        pass

    @abstractmethod
    def set_name(self, val):
        pass

    def get_hostname(self):
        pass

    @abstractmethod
    def set_hostname(self, val):
        pass

    @abstractmethod
    def get_description(self):
        pass

    @abstractmethod
    def set_description(self, val):
        pass

    @abstractmethod
    def get_calculations_on_computer(self):
        pass

    @abstractmethod
    def is_enabled(self):
        pass

[docs]    @abstractmethod
    def get_dbauthinfo(self, user):
        """
        Return the aiida.backends.djsite.db.models.DbAuthInfo instance for the
        given user on this computer, if the computer
        is not configured for the given user.

        :param user: a DbUser instance.
        :return: a aiida.backends.djsite.db.models.DbAuthInfo instance
        :raise NotExistent: if the computer is not configured for the given
            user.
        """
        pass

[docs]    @abstractmethod
    def is_user_configured(self, user):
        """
        Return True if the computer is configured for the given user,
        False otherwise.

        :param user: a DbUser instance.
        :return: a boolean.
        """
        pass

[docs]    @abstractmethod
    def is_user_enabled(self, user):
        """
        Return True if the computer is enabled for the given user (looking only
        at the per-user setting: the computer could still be globally disabled).

        :note: Return False also if the user is not configured for the computer.

        :param user: a DbUser instance.
        :return: a boolean.
        """
        pass

    @abstractmethod
    def set_enabled_state(self, enabled):
        pass

    @abstractmethod
    def get_scheduler_type(self):
        pass

    @abstractmethod
    def set_scheduler_type(self, val):
        pass

    @abstractmethod
    def get_transport_type(self):
        pass

    @abstractmethod
    def set_transport_type(self, val):
        pass

    def get_transport_class(self):
        try:
            # I return the class, not an instance
            return TransportFactory(self.get_transport_type())
        except MissingPluginError as e:
            raise ConfigurationError('No transport found for {} [type {}], message: {}'.format(
                self.name, self.get_transport_type(), e.message))

    def get_scheduler(self):
        try:
            ThisPlugin = SchedulerFactory(self.get_scheduler_type())
            # I call the init without any parameter
            return ThisPlugin()
        except MissingPluginError as e:
            raise ConfigurationError('No scheduler found for {} [type {}], message: {}'.format(
                self.name, self.get_scheduler_type(), e.message))

    def __repr__(self):
        return '<{}: {}>'.format(self.__class__.__name__, str(self))

    def __str__(self):
        if self.is_enabled():
            return "{} ({}), pk: {}".format(self.name, self.hostname,
                                            self.pk)
        else:
            return "{} ({}) [DISABLED], pk: {}".format(self.name, self.hostname,
                                                       self.pk)


class Util(object):
    __metaclass__ = ABCMeta

    @abstractmethod
    def delete_computer(self, pk):
        pass