Source code for ebm.model.filter_tek

import typing

import pandas as pd
from loguru import logger

from ebm.model.building_category import BuildingCategory
from ebm.model.data_classes import TEKParameters



[docs]
class FilterTek:
    """
    Utility class for filtering TEK lists and parameters. 
    """

    CATEGORY_APARTMENT = 'apartment_block'
    CATEGORY_HOUSE = 'house'
    COMMERCIAL_BUILDING = 'COM'
    RESIDENTIAL_BUILDING = 'RES'
    PRE_TEK49_APARTMENT = 'PRE_TEK49_RES_1950'
    PRE_TEK49_HOUSE = 'PRE_TEK49_RES_1940'


[docs]
    @staticmethod
    def get_filtered_list(building_category: BuildingCategory, building_code_list: typing.List[str]) -> typing.List[str]:
        """
        Filters the provided TEK list based on the building category.

        Parameters:
        - building_category (BuildingCategory): The category of the building.
        - building_code_list (List[str]): List of TEK strings to be filtered.

        Returns:
        - filtered_building_code_list (List[str]): Filtered list of TEK strings.
        """
        residential_building_list = [FilterTek.CATEGORY_APARTMENT, FilterTek.CATEGORY_HOUSE]
        
        if building_category in residential_building_list:
            # Filter out all TEKs associated with commercial buildings
            filtered_building_code_list = [tek for tek in building_code_list if FilterTek.COMMERCIAL_BUILDING not in tek]

            # Further filtering based on the specific residential building category
            if building_category == FilterTek.CATEGORY_APARTMENT:
                filtered_building_code_list = [tek for tek in filtered_building_code_list if tek != FilterTek.PRE_TEK49_HOUSE]
            elif building_category == FilterTek.CATEGORY_HOUSE:
                filtered_building_code_list = [tek for tek in filtered_building_code_list if tek != FilterTek.PRE_TEK49_APARTMENT]

        else:
            # Filter out all TEKs associated with residential buildings
            filtered_building_code_list = [tek for tek in building_code_list if FilterTek.RESIDENTIAL_BUILDING not in tek]

        return filtered_building_code_list

    
    # This method is only needed if building_code_params are initialized in the Buildings class

[docs]
    @staticmethod
    def get_filtered_params(building_code_list: typing.List[str],
                            building_code_params: typing.Dict[str, TEKParameters]) -> typing.Dict[str, TEKParameters]:
        """
        Filters the TEK parameters to include only those relevant to the provided TEK list.

        This method takes a dictionary of TEK parameters and filters it to include only 
        the parameters for TEKs that are present in the `building_code_list`. This ensures that 
        only the relevant TEK parameters are retained for use in subsequent calculations.

        Parameters:
        - building_code_list (List[str]): A list of TEK identifiers to filter by.
        - building_code_params (Dict[str, TEKParameters]): A dictionary where the keys are TEK identifiers 
                                                    and the values are TEKParameters objects containing
                                                    the parameters for each TEK.

        Returns:
        - filtered_building_code_params (Dict[str, TEKParameters]): A dictionary containing only the TEK parameters
                                                        for the TEKs present in the `building_code_list`.
        """
        filtered_building_code_params = {}
        for tek in building_code_list:
            filtered_building_code_params[tek] = building_code_params[tek]    

        return filtered_building_code_params



[docs]
    @staticmethod
    def merge_building_code(df: pd.DataFrame,
                  new_building_code_name: str,
                  old_building_code_names: typing.List[str],
                  aggregates: typing.Dict[str, str] = None) -> pd.DataFrame:
        """
        Merge rows in a DataFrame based on specified 'tek' names and aggregate their values.

        Parameters
        ----------
        df : pd.DataFrame
            The input DataFrame with a MultiIndex.
        new_building_code_name : str
            The new 'tek' name to assign to the merged rows.
        old_building_code_names : typing.List[str]
            A list of 'tek' names to be merged.
        aggregates : typing.Dict[str, str], optional
            A dictionary specifying the aggregation functions for each column.
            If not provided, default aggregations will be used:
            {'tek': 'max', 'm2': 'first', 'kwh_m2': 'mean', 'energy_requirement': 'sum'}.

        Returns
        -------
        pd.DataFrame
            The DataFrame with the specified 'tek' rows merged and aggregated.
        """
        if not isinstance(df, pd.DataFrame):
            raise ValueError("`df` should be a pandas DataFrame.")
        if not isinstance(old_building_code_names, list):
            raise ValueError("`old_building_code_names` should be a list of strings.")

        # Apply default aggregates if the parameter is empty
        aggregates = aggregates or {'building_code': 'max', 'm2': 'first', 'kwh_m2': 'mean', 'energy_requirement': 'sum'}
        building_code_values = [tek for tek in old_building_code_names if tek in df.index.get_level_values('building_code')]

        if not building_code_values:
            return df

        level_values = df.index.get_level_values('building_category')
        building_categories = [bc for bc in BuildingCategory if bc.is_residential() and bc in level_values]
        if not building_categories:
            return df

        residential = df.loc[
                (building_categories, slice(None), slice(None), slice(None), slice(None))].reset_index()

        building_code_to_merge = residential[residential.building_code.isin(building_code_values)]
        agg_building_code = building_code_to_merge.groupby(by=['building_category',
                                           'building_condition',
                                           'purpose',
                                           'year']).agg(aggregates)
        agg_building_code = agg_building_code.reset_index()

        agg_building_code['building_code'] = new_building_code_name
        rows_to_remove = df.loc[(slice(None), building_code_values, slice(None), slice(None), slice(None))].index
        df = df.drop(rows_to_remove)
        df = pd.concat([df, agg_building_code.set_index(['building_category', 'building_code', 'building_condition',  'year', 'purpose'])])
        df = df.sort_index()

        return df



[docs]
    @staticmethod
    def remove_building_code_suffix(df: pd.DataFrame, suffix) -> pd.DataFrame:
        # Convert MultiIndex to DataFrame
        index_df = df.index.to_frame(index=False)

        key_name = 'tek' if 'tek' in index_df.keys() else 'building_code'
        # Remove '_RES' from 'tek' values
        index_df[key_name] = index_df[key_name].str.replace(suffix, '')

        # Set the modified DataFrame back to MultiIndex
        df.index = pd.MultiIndex.from_frame(index_df)

        return df