Source code for gaiaxpy.cholesky.cholesky

"""
cholesky.py
====================================
Module that implements the Cholesky functionality.
"""
from pathlib import Path
from typing import Optional, Union

import numpy as np
import pandas as pd
from numpy import diag, dot, identity
from scipy.linalg import cholesky, solve_triangular

from gaiaxpy.core.generic_functions import parse_band
from gaiaxpy.core.satellite import BANDS
from gaiaxpy.input_reader.input_reader import InputReader


def __get_dot_product(_L_inv: np.ndarray) -> Optional[np.ndarray]:
    """
    Calculate the dot product of the transpose of L_inv with itself.

    Args:
        _L_inv (ndarray): A 2D numpy array.

    Returns:
        ndarray: The dot product of the transpose of L_inv with itself. None: If L_inv does not have the attribute `T`
            (transpose).
    """
    try:
        return dot(_L_inv.T, _L_inv)
    except AttributeError:
        return None


def __output_list_to_df(parsed_input_data: pd.DataFrame, bands_output: list, output_columns: list) -> pd.DataFrame:
    """
    Convert a list of output data into a pandas DataFrame.

    Args:
        parsed_input_data (pd.Dataframe): Parsed initial data.
        bands_output (list): A list of output data, where each element is a list of values for a specific band.
        output_columns (list): A list of strings representing the column names for the output DataFrame.

    Returns:
        pd.DataFrame: A DataFrame containing the source ID and the output data for each band.
    """
    output_list = [parsed_input_data['source_id']]
    for element in bands_output:
        output_list.append(element)
    return pd.DataFrame(zip(*output_list), columns=output_columns)


[docs] def get_inverse_square_root_covariance_matrix(input_object: Union[list, Path, str], band: Optional[str] = None): """ Compute the inverse square root covariance matrix. Args: input_object (list/Path/str): Path to the file containing the mean spectra as downloaded from the archive in their continuous representation, a pandas DataFrame, a list of sources ids (string or long), or an ADQL query. band (str): Chosen band: 'bp' or 'rp'. If no band is passed, the function will compute the inverse square root covariance for both 'bp' and 'rp'. Returns: DataFrame or ndarray: DataFrame containing the source IDs and the output inverse square root covariance matrices for the sources in the input object if it contains more than one source or no band is passed to the function. The function will return a ndarray (of shape (55, 55)) if there is only one source ID in the input data and a single band is selected. """ if band is not None: band = parse_band(band) parsed_input_data, extension = InputReader(input_object, get_inverse_square_root_covariance_matrix, False).read() if band is None: bands_to_process = BANDS output_columns = ['source_id', 'bp_inverse_square_root_covariance_matrix', 'rp_inverse_square_root_covariance_matrix'] else: bands_to_process = [band] output_columns = ['source_id', f'{band}_inverse_square_root_covariance_matrix'] bands_output = [] for b in bands_to_process: xp_errors = parsed_input_data[f'{b}_coefficient_errors'] / parsed_input_data[f'{b}_standard_deviation'] xp_correlation_matrix = parsed_input_data[f'{b}_coefficient_correlations'] band_inv_iterable = map(_get_inverse_square_root_covariance_matrix_aux, xp_errors, xp_correlation_matrix) bands_output.append(band_inv_iterable) output_df = __output_list_to_df(parsed_input_data, bands_output, output_columns) if len(bands_to_process) == 1 and len(output_df) == 1: return output_df[f'{band}_inverse_square_root_covariance_matrix'].iloc[0] else: return output_df
def _get_inverse_square_root_covariance_matrix_aux(xp_errors: np.ndarray, xp_correlation_matrix: np.ndarray) -> \ Optional[np.ndarray]: """ Calculate the inverse square root of the covariance matrix. Args: xp_errors (ndarray): A numpy array representing the measurement errors. xp_correlation_matrix (ndarray): A numpy array representing the correlation matrix. Returns: ndarray: The inverse square root of the covariance matrix. None: If the Cholesky decomposition of the correlation matrix fails. """ try: _L = cholesky(xp_correlation_matrix, lower=True) # Invert lower triangular matrix _L_inv = solve_triangular(_L, identity(len(_L)), lower=True) # Matrix of inverse errors _E_inv = diag(1.0 / xp_errors) return dot(_L_inv, _E_inv) except ValueError: return None
[docs] def get_inverse_covariance_matrix(input_object: Union[list, Path, str], band: Optional[str] = None): """ Compute the inverse covariance matrix. Args: input_object (object): Path to the file containing the mean spectra as downloaded from the archive in their continuous representation, a pandas DataFrame, a list of sources ids (string or long), or an ADQL query. band (str): Chosen band: 'bp' or 'rp'. If no band is passed, the function will compute the inverse covariance for both 'bp' and 'rp'. Returns: DataFrame or ndarray: DataFrame containing the source IDs and the output inverse covariance matrices for the sources in the input object if it contains more than one source or no band is passed to the function. The function will return a ndarray (of shape (55, 55)) if there is only one source ID in the input data and a single band is selected. """ band = band if band is None else parse_band(band) parsed_input_data, extension = InputReader(input_object, get_inverse_covariance_matrix, False).read() bands_output = [] if band is None: bands_to_process = BANDS output_columns = ['source_id', 'bp_inverse_covariance', 'rp_inverse_covariance'] else: bands_to_process = [band] output_columns = ['source_id', f'{band}_inverse_covariance'] for b in bands_to_process: # The formal errors need to be scaled by the inverse standard deviation. xp_errors = parsed_input_data[f'{b}_coefficient_errors'] / parsed_input_data[f'{b}_standard_deviation'] xp_correlation_matrix = parsed_input_data[f'{b}_coefficient_correlations'] _L_inv_iterable = map(_get_inverse_square_root_covariance_matrix_aux, xp_errors, xp_correlation_matrix) band_output = map(__get_dot_product, _L_inv_iterable) bands_output.append(band_output) output_df = __output_list_to_df(parsed_input_data, bands_output, output_columns) if len(bands_to_process) == 1 and len(output_df) == 1: return output_df[f'{band}_inverse_covariance'].iloc[0] else: return output_df
[docs] def get_chi2(_L_inv: np.ndarray, residuals: np.ndarray) -> np.ndarray: """ Compute chi-squared (chi2) from given inverse Cholesky of the covariance matrix (L^-1) and a residual vector (r = data - model). This function defines x = L^-1 * r such that chi2 = |x|^2, which guarantees that chi2 >= 0. Args: _L_inv (ndarray): Inverse square root of the covariance, as computed from the function get_inverse_square_root_covariance_matrix. residuals (ndarray): Difference between the observed coefficient vector and some model prediction of it. Returns: float: Chi-squared value. """ if _L_inv is None or residuals is None: raise ValueError('Input parameters cannot be None.') if _L_inv.shape != (55, 55): raise ValueError('Inverse covariance matrix shape must be (55, 55).') if residuals.shape != (55,): raise ValueError('Residuals shape must be (55,).') x = dot(_L_inv, residuals) return dot(x.T, x)