"""Module defining the Model class.
This module defines the Model class, the main object of the CVXLab package,
in charge of getting the main model settings and paths, and providing all the
methods useful for the user to handle the model and its main functionalities.
The Model class integrates various components such as logging, file management,
and core functionalities, ensuring a cohesive workflow from numerical problem
conceptualization, database generation and data input, numerical problem generation
and solution, results export to database.
The Model class embeds the generation of the Core class, which provides the centralized
data indexing, functionalities for SQLite database management, problem formulation
and solution through cvxpy package.
"""
from pathlib import Path
from typing import Any, List, Optional
import pandas as pd
from cvxlab.defaults import Defaults
from cvxlab.backend.core import Core
from cvxlab.log_exc import exceptions as exc
from cvxlab.log_exc.logger import Logger
from cvxlab.support.dotdict import DotDict
from cvxlab.support.file_manager import FileManager
from cvxlab.support import util
[docs]
class Model:
"""Central class for generating and handling a CVXLab models.
The Model class represents a modeling environment that handles SQLite data
generation and processing, database interactions, numerical optimization
model generation and handling with cvxpy package.
This class initializes with a configuration for managing directories,
logging, and file management for a specific model. It also sets up various
components including a logger, file manager, and core functionalities.
Attributes:
- logger (Logger): Logger object for logging information, warnings, and errors.
- files (FileManager): An instance of FileManager to manage file operations.
- settings (DotDict): A dictionary-like object storing configurations such as \
model name, file paths, and operational flags.
- paths (DotDict): A dictionary-like object storing the paths for model \
directories and associated files.
- core (Core): An instance of Core that manages the core functionality of the \
model (it embeds Index, Database and Problem instances).
"""
[docs]
def __init__(
self,
model_dir_name: str = 'model',
main_dir_path: Optional[str] = None,
model_settings_from: Defaults.LiteralTypes.SettingsSource = 'xlsx',
detailed_validation: bool = False,
use_existing_data: bool = False,
multiple_input_files: bool = False,
input_data_files_type: Defaults.LiteralTypes.DataFileType = 'xlsx',
log_level: Defaults.LiteralTypes.LogLevel = 'info',
log_format: Defaults.LiteralTypes.LogFormat = 'standard',
):
"""Initialize the Model instance with specified configurations.
This constructor sets up the Model instance by initializing logging,
file management, and core functionalities. It also checks for the
existence of the model directory and required setup files. If the
'use_existing_data' flag is set to True, it loads existing sets data
and variable coordinates to the Model.Index and initializes numerical
problems (the configuration files and model database should have been
already generated).
Args:
model_dir_name (str): The name of the model directory.
main_dir_path (str): The main directory path where the model
directory is located. If None, the current working directory is used.
model_settings_from (Defaults.LiteralTypes.SettingsSource, optional):
The format of the model settings file. Can be either 'yml' or 'xlsx'.
Defaults to 'xlsx'.
detailed_validation (bool, optional): if True, performs detailed
validation logging of data and model settings during initialization.
Defaults to False.
use_existing_data (bool, optional): if True, generation of Model
instance is also loading model coordinates and initializing
numerical problems. Note that setup files and model database should
have been already generated. Defaults to False.
multiple_input_files (bool, optional): if True, input data Excel files
are generated as one file per data table. If False, all data tables
are generated in a single Excel file with multiple tabs. Defaults
to False.
input_data_files_type (Defaults.LiteralTypes.DataFileType, optional):
The format of the input data files. Can be either 'xlsx' or 'csv'.
Defaults to 'xlsx'.
log_level (Defaults.LiteralTypes.LogLevel, optional):
The logging level for the logger. Defaults to 'info'.
log_format (Defaults.LiteralTypes.LogFormat, optional): The logging
format for the logger. Defaults to 'standard'.
"""
config = Defaults.ConfigFiles
if main_dir_path is None:
main_dir_path = str(Path.cwd())
model_dir_path = Path(main_dir_path) / model_dir_name
self.logger = Logger(
logger_name=str(self),
log_level=log_level.upper(),
log_format=log_format,
)
with self.logger.log_timing(
message=f"Model instance generation...",
level='info',
):
self.files = FileManager(logger=self.logger)
self.settings = DotDict({
'log_level': log_level,
'model_name': model_dir_name,
'model_settings_from': model_settings_from,
'use_existing_data': use_existing_data,
'multiple_input_files': multiple_input_files,
'input_data_files_type': input_data_files_type,
'detailed_validation': detailed_validation,
})
self.paths = DotDict({
'model_dir': model_dir_path,
'input_data_dir': model_dir_path / config.INPUT_DATA_DIR,
'sets_excel_file': model_dir_path / config.SETS_FILE,
'sqlite_database': model_dir_path / config.SQLITE_DATABASE_FILE,
})
self._check_model_dir()
self._check_settings_consistency()
self._import_custom_scripts()
self.core = Core(
logger=self.logger,
files=self.files,
settings=self.settings,
paths=self.paths,
)
if self.settings['use_existing_data']:
self._load_model_coordinates()
self._initialize_problems()
@property
def sets(self) -> List[str]:
"""List of sets names available in the model.
Returns:
List[str]: A list of set names.
"""
return self.core.index.list_sets
@property
def data_tables(self) -> List[str]:
"""List of data tables names available in the model.
Returns:
List[str]: A list of data table names.
"""
return self.core.index.list_data_tables
@property
def variables(self) -> List[str]:
"""List of variables names available in the model.
Returns:
List[str]: A list of variable names.
"""
return self.core.index.list_variables
@property
def is_problem_solved(self) -> bool:
"""Status of the problem solution.
Checks if the numerical problem has been solved (even if it has not
found a numerical solution).
Returns:
bool: True if the problem has been solved, False otherwise.
"""
if self.core.problem.problem_status is None:
return False
else:
return True
def _check_model_dir(self) -> None:
"""Validate the existence of the model directory and required files.
This method checks if the model directory and all the required files exist.
This method is called during the initialization of the Model instance, and
it is not meant to be called directly by the user.
Depending on the 'use_existing_data' flag, the method checks for the existence
of different files: if the flag is set to False, it checks for the existence
of the basic model settings files (.yml or .xlsx). If the flag is set to
True, it also includes in the check the existence of the SQLite database file,
the sets Excel file, and the input data directory.
Raises:
exc.SettingsError: If the 'model_settings_from' parameter is not recognized.
exc.SettingsError: If the model directory or any of the required
setup files are missing.
"""
files_type = self.settings['model_settings_from']
model_dir_path = self.paths['model_dir']
files_to_check = []
subdir_to_check = []
util.validate_selection(
valid_selections=Defaults.ConfigFiles.AVAILABLE_SETUP_SOURCES,
selection=files_type,
)
if files_type == 'yml':
files_to_check += [
file + '.yml'
for file in Defaults.ConfigFiles.SETUP_INFO.values()
]
elif files_type == 'xlsx':
files_to_check += [Defaults.ConfigFiles.SETUP_XLSX_FILE]
if self.settings['use_existing_data']:
files_to_check += [
Defaults.ConfigFiles.SETS_FILE,
Defaults.ConfigFiles.SQLITE_DATABASE_FILE,
]
subdir_to_check += [Defaults.ConfigFiles.INPUT_DATA_DIR]
err_msg = []
if not Path(model_dir_path).exists():
self.logger.error(
"Model directory validation | Model directory is missing."
)
raise exc.SettingsError("Model directory validation | Failed.")
for subdir in subdir_to_check:
if not Path(model_dir_path / subdir).exists():
err_msg.append(
f"Model directory validation | '{subdir}' directory is missing."
)
for file in files_to_check:
if not Path(model_dir_path / file).exists():
err_msg.append(
f"Model directory validation | '{file}' file is missing."
)
if err_msg == []:
self.logger.debug(
f"Model directory validation | Success.")
else:
[self.logger.error(msg) for msg in err_msg]
raise exc.SettingsError("Model directory validation | Failed.")
def _check_settings_consistency(self) -> None:
"""Check consistency of model settings.
This method checks the consistency of the model settings, ensuring that
the configurations provided by the user are coherent.
This method is called during the initialization of the Model instance, and
it is not meant to be called directly by the user.
Raises:
exc.SettingsError: If any inconsistency or invalid configuration
is found in the model settings.
"""
err_msg = []
# Check that input data csv files are only used for multiple input files
if self.settings['input_data_files_type'] == 'csv' and not \
self.settings['multiple_input_files']:
err_msg.append(
"Input data files of type 'csv' can only be used when "
"'multiple_input_files' setting is True."
)
# Add further checks below...
if err_msg == []:
self.logger.debug(
f"Model settings validation | Success.")
else:
[self.logger.error(msg) for msg in err_msg]
raise exc.SettingsError("Model settings validation | Failed.")
def _import_custom_scripts(self) -> None:
"""Import user-defined custom operators and constants.
This method automatically imports user-defined custom operators and constants from
the model directory if the corresponding files are present. No user flags required.
Raises:
FileNotFoundError: If the specified custom operators or constants
files are not found in the model directory.
"""
custom_scripts = {
'operators': {
'file_name': Defaults.ConfigFiles.CUSTOM_OPERATORS_FILE_NAME,
'target_registry': Defaults.SymbolicDefinitions.ALLOWED_OPERATORS,
},
'constants': {
'file_name': Defaults.ConfigFiles.CUSTOM_CONSTANTS_FILE_NAME,
'target_registry': Defaults.SymbolicDefinitions.ALLOWED_CONSTANTS,
}
}
for script_type, config in custom_scripts.items():
custom_functions = self.files.load_functions_from_module(
dir_path=self.paths['model_dir'],
file_name=config['file_name'],
)
if not custom_functions:
self.logger.debug(
f"Custom '{script_type}' import | Function(s) not defined "
f"or '{config['file_name']}' not found."
)
continue
# register functions
for function in custom_functions:
function_name = function.__name__
config['target_registry'][function_name] = function
self.logger.debug(
f"Custom '{script_type}' import | Imported "
f"{len(custom_functions)} custom "
f"function{'s' if len(custom_functions) != 1 else ''} "
f"from '{config['file_name']}'."
)
def _load_model_coordinates(self) -> None:
"""Load sets data and define data tables/variables coordinates.
This method fetches sets data from Excel to sets instances. It then
loads such data (referred as coordinates) to data tables and to variables.
Then, it filter variables coordinates based on user defined filters, and
checks variables coherence.
If the 'use_existing_data' flag is set to True, this method is called
during the initialization of the Model instance, and it is not meant to
be called directly by the user.
If the 'use_existing_data' flag is set to False, this method is called
into Model.prepare_model_environment, after having defined model settings
(data tables, variables, symbolic problem), generated the model instance,
and having filled the sets Excel file with model coordinates.
Raises:
exc.SettingsError: If the sets Excel file specified in the settings
is missing.
"""
with self.logger.log_timing(
message=f"Loading sets and variables coordinates...",
level='info',
):
try:
sets_xlsx_file = Defaults.ConfigFiles.SETS_FILE
self.core.index.load_sets_data_to_index(
excel_file_name=sets_xlsx_file,
excel_file_dir_path=self.paths['model_dir']
)
except FileNotFoundError as e:
msg = f"'{sets_xlsx_file}' file missing. Set 'use_existing_data' " \
"to False to generate a new settings file."
self.logger.error(msg)
raise exc.SettingsError(msg) from e
self.core.index.load_coordinates_to_data_index()
self.core.index.load_all_coordinates_to_variables_index()
self.core.index.filter_coordinates_in_variables_index()
self.core.index.check_variables_coherence()
self.core.index.fetch_foreign_keys_to_data_tables()
def _initialize_blank_data_structure(self) -> None:
"""Initialize blank data structure for the model.
This method generates the fundamental blank data structure for the model.
If the SQLite database already exists, it gives the option to erase it
and generate a new one, or to work with the existing SQLite database.
Same for the input data directory.
Specifically, the method creates:
- A blank SQLite database with set tables and data tables, filling data
tables with sets information.
- A blank Excel input data file/s with normalized data tables for getting
exogenous variables data from the user.
"""
use_existing_data = self.settings['use_existing_data']
sqlite_db_name = Defaults.ConfigFiles.SQLITE_DATABASE_FILE
sqlite_db_path = Path(self.paths['sqlite_database'])
input_files_dir_path = Path(self.paths['input_data_dir'])
erased_db = False
erased_input_dir = False
if use_existing_data:
self.logger.info(
"Relying on existing SQLite database and input excel file/s.")
return
with self.logger.log_timing(
message=f"Generation of blank data structures...",
level='info',
):
if sqlite_db_path.exists():
erased_db = self.files.erase_file(
dir_path=self.paths['model_dir'],
file_name=sqlite_db_name,
force_erase=False,
confirm=True,
)
if erased_db:
self.logger.info(
f"Existing SQLite database '{sqlite_db_name}' erased.")
if erased_db or not sqlite_db_path.exists():
self.logger.info(
f"Creating new blank SQLite database '{sqlite_db_name}'.")
self.core.database.create_blank_sqlite_database()
self.core.database.load_sets_to_sqlite_database()
self.core.database.generate_blank_sqlite_data_tables()
self.core.database.sets_data_to_sql_data_tables()
else:
self.logger.info(
f"Relying on existing SQLite database '{sqlite_db_name}' ")
if input_files_dir_path.exists():
erased_input_dir = self.files.erase_dir(
dir_path=input_files_dir_path,
force_erase=False,
)
if erased_input_dir:
self.logger.info("Existing input data directory erased.")
if erased_input_dir or not input_files_dir_path.exists():
self.logger.info(
"Generating new blank input data directory and related file/s.")
self.core.database.generate_blank_data_input_files()
else:
self.logger.info("Relying on existing input data directory.")
def _load_exogenous_data_to_sqlite_database(
self,
force_overwrite: bool = False,
table_key_list: list[str] = [],
) -> None:
"""Load exogenous (input) data to the SQLite database.
This method loads exogenous (input) data from Excel file/s to the
SQLite database. It also fills NaN values in the database with Null
values, to ensure proper handling of missing data in SQLite.
This method is called directly by the user after having filled the
input data Excel file/s with exogenous data.
However, the method is also called within the 'update_database_and_problem'
method, which can be used in case some changes in exogenous data have been
made, so that the SQLite database and the problems can be updated without
re-generating the Model instance.
The user can choose to load data for all exogenous data tables, or for
specific data tables (with the 'table_key_list' attribute).
Args:
force_overwrite (bool, optional): Whether to force overwrite existing
data without asking for user permission. Defaults to False.
table_key_list (list[str], optional): A list of data table keys
for which to load exogenous data. If empty, all exogenous data
tables are loaded. Defaults to [].
"""
with self.logger.log_timing(
message=f"Loading input data to SQLite database...",
level='info',
):
self.core.database.load_data_input_files_to_database(
force_overwrite=force_overwrite,
table_key_list=table_key_list,
)
self.core.database.fill_nan_values_in_database(
force_overwrite=force_overwrite,
table_key_list=table_key_list,
)
def _initialize_problems(
self,
force_overwrite: bool = False,
allow_none_values: bool = True,
) -> None:
"""Initialize numerical problems in the Model instance.
This method intializes numerical problems in the Model instance.
Specifically, the method loads and validates symbolic mathematical problems,
checks if all exogenous data have coherently defined by user, and finally
generates numercal problem (i.e. initializes variables, feeds data to
exogenous variables, and generates cvxpy problem/s).
Args:
force_overwrite (bool, optional): If True, forces the overwrite
of existing numerical problems without asking for user
permission. Used for testing purposes. Defaults to False.
allow_none_values (bool, optional): If True, allows None values in
the exogenous data. Defaults to True.
"""
with self.logger.log_timing(
message=f"Numerical model generation...",
level='info',
):
self.core.load_and_validate_symbolic_problem(force_overwrite)
self.core.check_exogenous_data_coherence()
self.core.generate_numerical_problem(
allow_none_values, force_overwrite)
[docs]
def initialize_model_environment(self) -> None:
"""Initialize the model environment for problem generation and solution.
This method prepares the model environment by loading sets data and
coordinates, and initializing blank data structures (SQLite database and
input data files). This method is typically called after having generated
the Model instance, and before generating numerical problems and solving them.
If the 'use_existing_data' flag is set to True, this method is not meant to be
called, since sets data and coordinates are already loaded, and blank data
structures are not generated relying on existing ones.
Raises:
exc.SettingsError: If the sets Excel file specified in the settings
is missing when loading model coordinates.
"""
if self.settings['use_existing_data']:
self.logger.info(
"Relying on existing model environment (sets coordinates, "
"SQLite database, input data files)."
)
return
self._load_model_coordinates()
self._initialize_blank_data_structure()
[docs]
def refresh_database_and_initialize_problem(
self,
table_key_list: list[str] = [],
force_overwrite: bool = False,
) -> None:
"""Update SQLite database with exogenous data and initialize problems.
This method loads the SQLite database exogenous data, and then initializes
numerical problems.
This method can be used for both initialization of the model environment,
after having generated the Model instance, and for updating the model
environment and the problems in case some changes in input data have been
made, without the need of re-generating the Model instance.
Args:
table_key_list (list[str], optional): A list of data table keys
for which to load exogenous data. If empty, all exogenous data
tables are loaded. Defaults to [].
force_overwrite (bool, optional): Whether to overwrite/update
existing data without asking user permission. Defaults to False.
"""
sqlite_db_file = Defaults.ConfigFiles.SQLITE_DATABASE_FILE
self.logger.info(
f"Loading exogenous data into SQLite database '{sqlite_db_file}' "
"and initializing problems.")
self._load_exogenous_data_to_sqlite_database(
force_overwrite, table_key_list)
self._initialize_problems(force_overwrite)
[docs]
def run_model(
self,
force_overwrite: bool = False,
integrated_problems: bool = False,
convergence_monitoring: bool = True,
solver: Optional[str] = None,
solver_verbose: bool = False,
solver_settings: Optional[dict[str, Any]] = None,
convergence_norm: Defaults.LiteralTypes.NormType = 'l2',
convergence_tables_to_check: Defaults.LiteralTypes.ConvergenceTables | List[
str] = 'all_endogenous',
convergence_tables_to_skip: Optional[List[str]] = None,
relative_tolerance: Optional[float] = None,
maximum_iterations: Optional[int] = None,
keep_previous_iteration_db: bool = False,
**kwargs: Any,
) -> None:
"""Solve numerical problems defined by the model instance.
This method first performs some coherence checks (if solver is supported,
if numerical problems are defined, if integrated problems are possible).
Then, it solves the numerical problems, either independently or in an
integrated manner, based on the 'integrated_problems' flag.
Finally, it logs a summary of the problems status.
Args:
force_overwrite (bool, optional): If True, overwrites existing results.
Defaults to False.
integrated_problems (bool, optional): If True, solve problems iteratively
using a block Gauss-Seidel (alternating optimization) scheme, where
updated endogenous variables are exchanged until convergence.
Defaults to False.
convergence_monitoring (bool, optional): If True, enables convergence
monitoring during the solving of integrated problems. Defaults to True.
solver (str, optional): The solver to use for solving numerical
problems. Defaults to None, in which case the default solver
specified in 'Defaults.NumericalSettings.CVXPY_DEFAULT_SETTINGS' is used.
solver_verbose (bool, optional): If True, logs verbose output related to
numerical solver operation during the model run. Defaults to False.
solver_settings (dict[str, Any], optional): Additional settings
for the solver passed as key-value pairs. Defaults to None.
convergence_norm (Defaults.LiteralTypes.NormType, optional):
The norm type to use for convergence monitoring in integrated
problems. Defaults to 'l2' (Euclidean Norm).
convergence_tables_to_check (Defaults.LiteralTypes.ConvergenceTables |
List[str], optional): The data tables to consider for convergence
monitoring in integrated problems. Can be 'all_endogenous',
'hybrid_only', or a list of specific data table keys. Defaults
to 'all_endogenous'.
convergence_tables_to_skip (Optional[List[str]], optional): List of data table
keys to skip for convergence checking in integrated problems. If None,
no tables are skipped. Defaults to None.
relative_tolerance (float, optional): Numerical tolerance for verifying
maximum relative change between iterations in integrated problems for
each data table. Overrides 'Defaults.NumericalSettings.MODEL_COUPLING_SETTINGS'.
maximum_iterations (int, optional): The maximum number of iterations
for solving integrated problems. Overrides
'Defaults.NumericalSettings.MODEL_COUPLING_SETTINGS'.
keep_previous_iteration_db (bool, optional): Whether keep or not the database
generated during the last-1 iteration. For debugging purpose. Default to
False.
**kwargs: Additional keyword arguments to be passed to the solver. Useful
for setting solver-specific options.
Raises:
exc.SettingsError: In case solver is not supported by current cvxpy version.
exc.SettingsError: If no numerical problems are found, or if integrated
problems are requested but only one problem is found.
"""
cvxpy_defaults = Defaults.NumericalSettings.CVXPY_DEFAULT_SETTINGS
cvxpy_allowed_solvers = Defaults.NumericalSettings.ALLOWED_SOLVERS
sub_problems = self.core.problem.number_of_sub_problems
problem_scenarios = len(self.core.index.scenarios_info)
# Merge order: defaults < solver_settings < kwargs < explicit 'solver' arg
solver_config = {
**cvxpy_defaults,
**(solver_settings or {}),
**kwargs,
}
if solver is not None:
solver_config['solver'] = solver
selected_solver = solver_config.get('solver', cvxpy_defaults['solver'])
if selected_solver not in cvxpy_allowed_solvers:
msg = f"Solver '{selected_solver}' not supported by current CVXPY " \
f"version. Available solvers: {cvxpy_allowed_solvers}"
self.logger.error(msg)
raise exc.SettingsError(msg)
solver_settings = solver_config.copy()
solver_settings['solver'] = selected_solver
solver_settings['verbose'] = solver_verbose
if sub_problems == 0:
msg = "Numerical problem not found. Initialize problem first."
self.logger.error(msg)
raise exc.SettingsError(msg)
if integrated_problems and sub_problems == 1:
msg = "Only one problem found. Integrated problems not possible."
self.logger.error(msg)
raise exc.SettingsError(msg)
if integrated_problems and sub_problems > 1:
solution_type = 'integrated'
else:
solution_type = 'independent'
problem_count = '1' if sub_problems == 1 else f'{sub_problems}'
self.logger.info(
f"Model run | Solution mode: {solution_type}' | Solver: '{solver}' | "
f"Problems: {problem_count} | Scenarios: {problem_scenarios}")
if solver_verbose:
self.logger.info("Model run | CVXPY logs below")
with self.logger.log_timing(
message=f"Solving numerical problems...",
level='info',
):
self.core.solve_numerical_problems(
force_overwrite=force_overwrite,
integrated_problems=integrated_problems,
convergence_monitoring=convergence_monitoring,
convergence_norm=convergence_norm,
convergence_tables_to_check=convergence_tables_to_check,
convergence_tables_to_skip=convergence_tables_to_skip,
relative_tolerance=relative_tolerance,
maximum_iterations=maximum_iterations,
keep_previous_iteration_db=keep_previous_iteration_db,
**solver_settings,
)
msg = "Numerical problems status report:"
self.logger.info("="*len(msg))
self.logger.info(msg)
for info, status in self.core.problem.problem_status.items():
self.logger.info(
f"{info}: {status}" if info else f"{status}"
)
[docs]
def load_results_to_database(
self,
scenarios_idx: Optional[List[int] | int] = None,
force_overwrite: bool = False,
suppress_warnings: bool = False,
) -> None:
"""Export model results to the SQLite database.
This method exports the results of the numerical problems to the SQLite
database. It can export results for all scenarios or for specific scenarios
(defined as the linear combinations of inter-problem sets that identify
independent numerical problems), based on the 'scenarios_idx' attribute
Args:
scenarios_idx (Optional[List[int] | int], optional): A list of
scenario indices or a single scenario index for which to export
results. If None, results for all scenarios are exported. Defaults
to None.
force_overwrite (bool, optional): Whether to overwrite/update
existing data without asking user permission. Defaults to False.
suppress_warnings (bool, optional): Whether to suppress warnings
during the data loading process. Defaults to False.
"""
with self.logger.log_timing(
message=f"Exporting endogenous model results to SQLite database...",
level='info',
):
if not self.is_problem_solved:
self.logger.warning(
"Numerical problem has not solved yet and results "
"cannot be exported.")
return
self.core.cvxpy_endogenous_data_to_database(
scenarios_idx=scenarios_idx,
force_overwrite=force_overwrite,
suppress_warnings=suppress_warnings
)
[docs]
def reinitialize_sqlite_database(
self,
force_overwrite: bool = False
) -> None:
"""Reinitialize SQLite database tables and reimport input data.
This method reinitializes endogenous tables in SQLite database to Null
values, and reimports input data to exogenous tables.
Args:
force_overwrite (bool, optional): Whether to force overwrite
existing data. Used for testing purposes. Defaults to False.
"""
sqlite_db_file = Defaults.ConfigFiles.SQLITE_DATABASE_FILE
self.logger.info(
f"Reinitializing SQLite database '{sqlite_db_file}' "
"endogenous tables.")
self.core.database.reinit_sqlite_endogenous_tables(force_overwrite)
self._load_exogenous_data_to_sqlite_database(force_overwrite)
[docs]
def check_model_results(
self,
other_db_dir_path: Optional[Path | str] = None,
other_db_name: Optional[str] = None,
numerical_tolerance: Optional[float] = None,
) -> None:
"""Compare model SQLite database with another SQLite reference database.
This method compares the results of the model's SQLite database with those
of another SQLite database, typically for testing purposes. It uses the
'check_results_as_expected' method to compare the current model's computations
with the expected results. The expected results can be stored in a specific
database (identified by directory path and name), or stored in a test database
specified by the SQLite test database default name and located in the model
directory.
Both 'other_db_dir_path' and 'other_db_name' must be provided together, or both
must be None. If not provided, defaults are used.
Args:
other_db_dir_path (Optional[Path | str], optional): The directory path
where the other SQLite database is located. If None, it defaults
to the model directory. Defaults to None.
other_db_name (Optional[str], optional): The name of the other SQLite
database file. If None, it defaults to the SQLite test database
default name. Defaults to None.
numerical_tolerance (float, optional): The relative difference
(non-percentage) tolerance for comparing numerical values in
different databases. If None, it is set to
'Defaults.NumericalSettings.TOLERANCE_TESTS_RESULTS_CHECK'.
"""
if (other_db_dir_path is None) != (other_db_name is None):
msg = "Both 'other_db_dir_path' and 'other_db_name' parameters must " \
"be defined together, or both must be None."
self.logger.error(msg)
raise exc.SettingsError(msg)
if other_db_dir_path is None:
other_db_dir_path = self.paths['model_dir']
if other_db_name is None:
other_db_name = Defaults.ConfigFiles.SQLITE_DATABASE_FILE_TEST
if not numerical_tolerance:
numerical_tolerance = \
Defaults.NumericalSettings.TOLERANCE_TESTS_RESULTS_CHECK
with self.logger.log_timing(
message=f"Check model results...",
level='info',
):
self.core.compare_databases(
values_relative_diff_tolerance=numerical_tolerance,
other_db_dir_path=other_db_dir_path,
other_db_name=other_db_name,
)
[docs]
def update_sets_tables(
self,
set_keys_list: List[str] = [],
update_mode: Defaults.LiteralTypes.SetUpdateMode = 'all',
) -> None:
"""Update sets tables in the SQLite database.
This method updates sets tables in the SQLite database. The user can choose
to update all sets, or only specific sets (with the 'set_keys_list' attribute).
Additionally, the user can specify the update mode, which can be 'all',
'filters', or 'aggregations'.
Args:
set_keys_list (List[str], optional): A list of set keys to update.
If empty, all sets are updated. Defaults to [].
update_mode (Defaults.LiteralTypes.SetUpdateMode, optional):
The update mode. Can be 'all' (update all set data), 'filters'
(update only filters), or 'aggregations' (update only aggregations).
Defaults to 'all'.
"""
self.core.database.update_sets_in_sqlite_database(
set_keys_list=set_keys_list,
update_mode=update_mode,
)
[docs]
def variable(
self,
name: str,
scenario_key: Optional[int] = None,
intra_problem_key: Optional[int] = None,
if_hybrid_var: Defaults.LiteralTypes.HybridVarType = 'endogenous',
) -> Optional[pd.DataFrame]:
"""Fetch variable data.
This method retrieves the data for a specified variable based on optional
inter-problem and intra-problem sets cardinality, supporting the data
inspection process after a model has run, but before data has exported to the
database. This is particularly useful in case multiple runs of the model,
to facilitate the control of the numerical data from the user.
In case a variable is defined as both endogeous and exogenous, depending on
the numerical problem, the user can specify the one to inspect (default
as the endogenous one).
If the variable is specified for multiple inter- and intra-problem sets,
scenario_key defines the cardinality of inter-problem sets, while
intra_problem_key defines the cardinality of intra-problem sets.
Args:
name (str): The key of the variable in the variables dictionary.
scenario_key (Optional[int]): Defines the cardinality of inter-problem
sets. Default to None.
intra_problem_key (Optional[int]): Defines the cardinality of intra-problem
sets. Default to None.
if_hybrid_var (Defaults.LiteralTypes.HybridVarType): Defines the type
of variable data to inspect in case variable type depends on the
problem.
Returns:
Optional[pd.DataFrame]: The data for the specified variable.
"""
return self.core.index.fetch_variable_data(
var_key=name,
scenario_key=scenario_key,
intra_problem_key=intra_problem_key,
if_hybrid_var=if_hybrid_var,
)
[docs]
def set(self, name: str) -> Optional[pd.DataFrame]:
"""Fetch set data.
Useful for inspecting variables data during model generation and debugging.
Args:
name (str): The name of the set.
Returns:
Optional[pd.DataFrame]: The data for the specified set.
"""
return self.core.index.fetch_set_data(set_key=name)
def __repr__(self):
"""Return a string representation of the Model instance."""
class_name = type(self).__name__
return f'{class_name}'