Source code for biogeme.specification

######
# TODO: combine the built-in validity conditions with the user-defined validity check.
# TODO: report the validity message (the reason why a specification is invalid).


"""Model specification in a multiple expression context

:author: Michel Bierlaire
:date: Mon Apr 10 12:33:18 2023

Implements a model specification in a multiple expression context (using Catalogs)
"""
from __future__ import annotations

import logging
from typing import TYPE_CHECKING, Callable

from biogeme_optimization.pareto import SetElement

import biogeme.biogeme as bio
import biogeme.tools.unique_ids
from biogeme.configuration import Configuration
from biogeme.exceptions import BiogemeError
from biogeme.parameters import get_default_value, Parameters
from biogeme.validity import Validity
from biogeme.results import bioResults

if TYPE_CHECKING:
    from biogeme.results import bioResults

logger = logging.getLogger(__name__)


class Specification:
    """Model specification: one configuration of a catalog-based expression.

    Creating an instance triggers the estimation of the corresponding
    model, unless results for the same configuration ID are already
    stored in :attr:`all_results`.

    The attributes ``database`` and ``expression`` are defined at class
    level and must be set on the class before any instance is created.
    """

    database = None  #: :class:`biogeme.database.Database` object

    #: dict(str: `biogeme.results.bioResults`), indexed by configuration ID.
    #: Defined at class level: the same dictionary is shared by all
    #: instances and acts as a cache of estimation results.
    all_results = {}

    expression = None  #: :class:`biogeme.expressions.Expression` object

    #: Optional function that checks the validity of the estimation
    #: results. It is called with the results as single argument, and its
    #: return value is stored as ``self.validity``.
    #: NOTE(review): it is called through the instance
    #: (``self.user_defined_validity_check(results)``), so a plain function
    #: assigned on the class presumably needs to be wrapped in
    #: ``staticmethod`` -- confirm against the callers.
    user_defined_validity_check = None

    generic_name = 'default_name'  #: short name for file names

    #: Biogeme parameters, used to obtain ``maximum_number_parameters``.
    biogeme_parameters: Parameters | None = None

    def __init__(
        self,
        configuration: Configuration,
        biogeme_parameters: Parameters | None = None,
    ):
        """Creates a specification from a configuration, and estimates it.

        :param configuration: configuration of the multiple expression
        :param biogeme_parameters: parameters from which the entry
            ``maximum_number_parameters`` of the section
            ``AssistedSpecification`` is read. If None, the default value
            of that entry is used.

        :raise BiogemeError: if ``configuration`` is not an object of type
            Configuration, or if the class attributes ``expression`` or
            ``database`` have not been set.
        """
        if not isinstance(configuration, Configuration):
            error_msg = 'Ctor needs an object of type Configuration'
            raise BiogemeError(error_msg)
        self.configuration = configuration
        self.model_names = None
        self.validity = None
        self.biogeme_parameters = biogeme_parameters
        if biogeme_parameters is None:
            self.maximum_number_parameters = get_default_value(
                name='maximum_number_parameters', section='AssistedSpecification'
            )
        else:
            self.maximum_number_parameters = biogeme_parameters.get_value(
                name='maximum_number_parameters', section='AssistedSpecification'
            )
        logger.debug(f'{self.maximum_number_parameters=}')
        self._estimate()
        # Internal post-conditions of _estimate, not input validation.
        assert (
            self.validity is not None
        ), 'Validity must be set by the _estimate function'
        assert (
            self.all_results.get(self.config_id) is not None
        ), 'Results have not been generated'

    @classmethod
    def from_string_id(
        cls,
        configuration_id: str,
        biogeme_parameters: Parameters | None = None,
    ) -> Specification:
        """Constructor using the string ID of a configuration

        :param configuration_id: string ID of the configuration
        :param biogeme_parameters: optional parameters forwarded to the
            constructor. If None, the constructor is called with the
            configuration only.

        :return: the specification associated with the configuration
        """
        the_config = Configuration.from_string(configuration_id)
        if biogeme_parameters is None:
            return cls(the_config)
        return cls(the_config, biogeme_parameters=biogeme_parameters)

    def configure_expression(self) -> None:
        """Configure the expression to the current configuration

        :raise BiogemeError: if no expression has been provided.
        """
        if self.expression is None:
            error_msg = 'No expression has been provided for the model.'
            raise BiogemeError(error_msg)
        self.expression.configure_catalogs(self.configuration)

    @classmethod
    def default_specification(
        cls, biogeme_parameters: Parameters | None = None
    ) -> Specification:
        """Alternative constructor generating the default specification

        The selection of the expression is reset, and the resulting
        current configuration is used to build the specification.

        :param biogeme_parameters: optional parameters forwarded to the
            constructor. If None, the constructor is called with the
            configuration only.

        :return: the specification for the default configuration

        :raise BiogemeError: if no expression has been provided.
        """
        if cls.expression is None:
            # Same diagnostic as in _estimate, instead of an AttributeError
            # on None.
            error_msg = 'No expression has been provided for the model.'
            raise BiogemeError(error_msg)
        cls.expression.reset_expression_selection()
        the_config = cls.expression.current_configuration()
        if biogeme_parameters is None:
            return cls(the_config)
        return cls(the_config, biogeme_parameters=biogeme_parameters)

    @property
    def config_id(self) -> str:
        """String ID of the configuration, exposed as a property"""
        return self.configuration.get_string_id()

    @config_id.setter
    def config_id(self, value: str) -> None:
        # The configuration is rebuilt from its string ID.
        self.configuration = Configuration.from_string(value)

    def get_results(self) -> bioResults:
        """Obtain the estimation results of the specification

        :return: the results stored for the current configuration ID

        :raise BiogemeError: if no result is stored for this configuration.
        """
        the_results = self.all_results.get(self.config_id)
        if the_results is None:
            error_msg = f'No result is available for specification {self.config_id}'
            raise BiogemeError(error_msg)
        return the_results

    def __repr__(self) -> str:
        return str(self.config_id)

    def _estimate(self) -> None:
        """Estimate the parameters of the current specification, if not
        already done, and set ``self.validity``.

        :raise BiogemeError: if no expression or no database has been
            provided.
        """
        if self.expression is None:
            error_msg = 'No expression has been provided for the model.'
            raise BiogemeError(error_msg)
        if self.database is None:
            error_msg = 'No database has been provided for the estimation.'
            raise BiogemeError(error_msg)
        if self.model_names is None:
            self.model_names = biogeme.tools.unique_ids.ModelNames(
                prefix=self.generic_name
            )

        if self.config_id in self.all_results:
            # Already estimated: reuse the stored results.
            # NOTE(review): if the stored object is the empty placeholder
            # created below for a model with too many parameters, the
            # "Too many parameters" validity is not restored here; the
            # validity is recomputed from the placeholder instead.
            results = self.all_results.get(self.config_id)
        else:
            logger.debug(f'****** Estimate {self.config_id}')
            the_biogeme = bio.BIOGEME.from_configuration(
                config_id=self.config_id,
                expression=self.expression,
                database=self.database,
            )
            number_of_parameters = the_biogeme.number_unknown_parameters()
            logger.info(
                f'Model with {number_of_parameters} unknown parameters '
                f'[max: {self.maximum_number_parameters}]'
            )
            if number_of_parameters > self.maximum_number_parameters:
                logger.info(
                    f'Invalid as it exceeds the maximum number of parameters: '
                    f'{self.maximum_number_parameters}'
                )
                self.validity = Validity(
                    status=False,
                    reason=(
                        f'Too many parameters: {number_of_parameters} > '
                        f'{self.maximum_number_parameters}'
                    ),
                )
                # The model is not estimated. An empty results object is
                # stored so that an entry exists for this configuration.
                self.all_results[self.config_id] = bioResults()
                return

            the_biogeme.modelName = self.model_names(self.config_id)
            logger.info(f'*** Estimate {the_biogeme.modelName}')
            the_biogeme.generate_html = False
            the_biogeme.generate_pickle = False
            results = the_biogeme.quick_estimate()
            self.all_results[self.config_id] = results

        if not results.algorithm_has_converged():
            self.validity = Validity(
                status=False, reason='Optimization algorithm has not converged'
            )
            return

        if self.user_defined_validity_check is not None:
            self.validity = self.user_defined_validity_check(results)
        else:
            self.validity = Validity(status=True, reason='')

    def describe(self) -> str:
        """Short description of the solution. Used for reporting.

        :return: short description of the solution.
        :rtype: str

        :raise BiogemeError: if no result is stored for this configuration
            (raised by :meth:`get_results`).
        """
        # get_results never returns None: it raises if nothing is stored.
        the_results = self.get_results()
        return f'{the_results.short_summary()}'

    def get_element(
        self, multi_objectives: Callable[[bioResults | None], list[float]]
    ) -> SetElement:
        """Obtains the element from the Pareto set corresponding to a specification

        :param multi_objectives: function calculating the objectives
            from the estimation results
        :type multi_objectives: fct(biogeme.results.bioResults) --> list[float]

        :return: element from the Pareto set
        :rtype: biogeme.pareto.SetElement

        :raise BiogemeError: if no result is stored for this configuration
            (raised by :meth:`get_results`).
        """
        the_id = self.config_id
        the_results = self.get_results()
        the_objectives = multi_objectives(the_results)
        element = SetElement(the_id, the_objectives)
        logger.debug(f'{element=}')
        return element