Source code for citylearn.end_use_load_profiles.neighborhood

import concurrent.futures
from copy import deepcopy
import os
from enum import Enum, unique
from pathlib import Path
import random
import shutil
from typing import Any, Callable, List, Mapping, Tuple, Union
from doe_xstock.data import VersionDatasetType
from doe_xstock.end_use_load_profiles import EndUseLoadProfiles
from doe_xstock.simulate import EndUseLoadProfilesEnergyPlusSimulator, OpenStudioModelEditor
import numpy as np
import pandas as pd
from sklearn.metrics import mean_squared_error, mean_absolute_percentage_error
import torch
from citylearn.agents.base import Agent, BaselineAgent
from citylearn.base import Environment
from citylearn.building import Building
from citylearn.citylearn import CityLearnEnv
from citylearn.data import get_settings
from citylearn.dynamics import LSTMDynamics
from citylearn.end_use_load_profiles.clustering import MetadataClustering
from citylearn.end_use_load_profiles.lstm_model.model_generation_wrapper import run_one_model
from citylearn.end_use_load_profiles.simulate import EndUseLoadProfilesEnergyPlusPartialLoadSimulator
from citylearn.preprocessing import PeriodicNormalization, Normalize
from citylearn.utilities import read_json, write_json

BuildingSimulators = Mapping[
    str, 
    Union[EndUseLoadProfilesEnergyPlusSimulator, EndUseLoadProfilesEnergyPlusSimulator, List[EndUseLoadProfilesEnergyPlusPartialLoadSimulator]]
]
BuildingsSimulators = List[BuildingSimulators]

[docs] @unique class SampleMethod(Enum): RANDOM = 0 METADATA_CLUSTER_FREQUENCY = 1
[docs] class NeighborhoodBuild: def __init__( self, schema_filepath: Path, citylearn_simulation_test_evaluation: pd.DataFrame, citylearn_simulation_lstm_prediction_data: Mapping[int, pd.DataFrame], citylearn_simulation_lstm_error_data: Mapping[int, pd.DataFrame], lstm_test_data: Mapping[int, pd.DataFrame], bldg_ids: List[int], sample_cluster_labels: List[int], sample_metadata: Mapping[str, Any], simulators: BuildingsSimulators ): self.__schema_filepath = schema_filepath self.__citylearn_simulation_test_evaluation = citylearn_simulation_test_evaluation self.__citylearn_simulation_lstm_prediction_data = citylearn_simulation_lstm_prediction_data self.__citylearn_simulation_lstm_error_data = citylearn_simulation_lstm_error_data self.__lstm_test_data = lstm_test_data self.__bldg_ids = bldg_ids self.__sample_cluster_labels = sample_cluster_labels self.__sample_metadata = sample_metadata self.__simulators = simulators @property def schema_filepath(self) -> Path: return self.__schema_filepath @property def citylearn_simulation_test_evaluation(self) -> pd.DataFrame: return self.__citylearn_simulation_test_evaluation @property def citylearn_simulation_lstm_prediction_data(self) -> List[pd.DataFrame]: return self.__citylearn_simulation_lstm_prediction_data @property def citylearn_simulation_lstm_error_data(self) -> List[pd.DataFrame]: return self.__citylearn_simulation_lstm_error_data @property def lstm_test_data(self) -> List[pd.DataFrame]: return self.__lstm_test_data @property def bldg_ids(self) -> List[int]: return self.__bldg_ids @property def sample_cluster_labels(self) -> List[int]: return self.__sample_cluster_labels @property def sample_metadata(self) -> Mapping[str, Any]: return self.__sample_metadata @property def simulators(self) -> BuildingsSimulators: return self.__simulators
[docs] class Neighborhood: __BUILDING_TYPE_COLUMN = 'in.geometry_building_type_recs' __SINGLE_FAMILY_BUILDING_TYPE_NAME = 'Single-Family Detached' __COUNTY_COLUMN = 'in.resstock_county_id' def __init__( self, weather_data: str = None, year_of_publication: int = None, release: int = None, cache: bool = None, energyplus_output_directory: Union[Path, str] = None, dataset_directory: Union[Path, str] = None, max_workers: int = None, random_seed: int = None ) -> None: self.__end_use_load_profiles = EndUseLoadProfiles( dataset_type=VersionDatasetType.RESSTOCK, weather_data=weather_data, year_of_publication=year_of_publication, release=release, cache=cache, ) self.energyplus_output_directory = energyplus_output_directory self.dataset_directory = dataset_directory self.max_workers = max_workers self.random_seed = random_seed @property def end_use_load_profiles(self) -> EndUseLoadProfiles: return self.__end_use_load_profiles @property def energyplus_output_directory(self) -> Union[Path, str]: return self.__energyplus_output_directory @property def dataset_directory(self) -> Union[Path, str]: return self.__dataset_directory @property def max_workers(self) -> int: return self.__max_workers @property def random_seed(self) -> int: return self.__random_seed @energyplus_output_directory.setter def energyplus_output_directory(self, value: Union[Path, str]): self.__energyplus_output_directory = 'neighborhood_energyplus_output' if value is None else value @dataset_directory.setter def dataset_directory(self, value: Union[Path, str]): self.__dataset_directory = 'neighborhood_datasets' if value is None else value @max_workers.setter def max_workers(self, value: int): self.__max_workers = value @random_seed.setter def random_seed(self, value: int): self.__random_seed = random.randint(*Environment.DEFAULT_RANDOM_SEED_RANGE) if value is None else value
[docs] def build( self, idd_filepath: Union[Path, str], bldg_ids: List[int] = None, include_lstm_models: bool = None, test_lstm_models: bool = None, test_citylearn_simulation: bool = None, delete_energyplus_simulation_output: bool = None, sample_buildings_kwargs: Mapping[str, Any] = None, energyplus_simulation_kwargs: Mapping[str, Any] = None, train_lstm_kwargs: Mapping[str, Any] = None, schema_kwargs: Mapping[str, Any] = None, test_citylearn_simulation_kwargs: Mapping[str, Any] = None ) -> NeighborhoodBuild: sample_buildings_kwargs = {} if sample_buildings_kwargs is None else sample_buildings_kwargs energyplus_simulation_kwargs = {} if energyplus_simulation_kwargs is None else energyplus_simulation_kwargs train_lstm_kwargs = {} if train_lstm_kwargs is None else train_lstm_kwargs schema_kwargs = {} if schema_kwargs is None else schema_kwargs test_citylearn_simulation_kwargs = {} if test_citylearn_simulation_kwargs is None else test_citylearn_simulation_kwargs include_lstm_models = True if include_lstm_models is None else include_lstm_models test_citylearn_simulation = True if test_citylearn_simulation is None else test_citylearn_simulation test_lstm_models = True if test_lstm_models is None else test_lstm_models delete_energyplus_simulation_output = False if delete_energyplus_simulation_output is None else delete_energyplus_simulation_output labels = None sample_metadata = None simulators = None lstm_training_data = None lstm_models = None schema_filepath = None citylearn_simulation_evaluation = None citylearn_simulation_lstm_prediction_data = None citylearn_simulation_lstm_error_data = None lstm_test_data = None # sample buildings if bldg_ids is None: bldg_ids, labels, sample_metadata = self.sample_buildings(**sample_buildings_kwargs) else: pass # run energyplus simulations simulators = self.simulate_energy_plus(bldg_ids, idd_filepath, **energyplus_simulation_kwargs) # train LSTM models if include_lstm_models: lstm_training_data = self.get_lstm_training_data(simulators) lstm_models = self.train_lstm(lstm_training_data, **train_lstm_kwargs) else: pass # generate schema schema_filepath = self.set_schema(simulators, bldg_ids, lstm_models=lstm_models, **schema_kwargs) # confirm schema initializes correctly in CityLearn and simulation completes without errors if test_citylearn_simulation: citylearn_simulation_evaluation, citylearn_simulation_lstm_prediction_data, citylearn_simulation_lstm_error_data \ = self.test_citylearn_simulation(schema_filepath, **test_citylearn_simulation_kwargs) else: pass # run test on generated LSTM training data for all partial load simulation references if include_lstm_models and test_lstm_models: lstm_test_data = self.multiprocess_test_lstm(lstm_training_data, schema_filepath) else: pass # delete energyplus output files to save space if delete_energyplus_simulation_output: self.delete_energyplus_simulation_output(simulators) else: pass return NeighborhoodBuild( schema_filepath=schema_filepath, citylearn_simulation_test_evaluation=citylearn_simulation_evaluation, citylearn_simulation_lstm_prediction_data=citylearn_simulation_lstm_prediction_data, citylearn_simulation_lstm_error_data=citylearn_simulation_lstm_error_data, lstm_test_data=lstm_test_data, bldg_ids=bldg_ids, sample_cluster_labels=labels, sample_metadata=sample_metadata, simulators=simulators )
[docs] def delete_energyplus_simulation_output(self, simulators: BuildingsSimulators): directories = [Path(s['ideal'].output_directory).parents[0] for s in simulators] for d in directories: if os.path.isdir(d): shutil.rmtree(d) else: pass
[docs] def multiprocess_test_lstm(self, training_data: List[pd.DataFrame], schema_filepath: Path) -> List[pd.DataFrame]: test_data = [None]*len(training_data) with concurrent.futures.ProcessPoolExecutor(max_workers=self.max_workers) as executor: results = [executor.submit( self.test_lstm, *(i, td.copy(), schema_filepath) ) for i, td in enumerate(training_data)] for future in concurrent.futures.as_completed(results): result = future.result() test_data[result[0]] = result[1] return test_data
[docs] def test_lstm(self, bldg_ix: int, training_data: pd.DataFrame, schema_filepath: Path) -> Tuple[int, pd.DataFrame]: # set data schema = read_json(schema_filepath) schema_directory = Path(schema_filepath).parents[0] bldg_key = list(schema['buildings'].keys())[bldg_ix] dynamics_model = schema['buildings'][bldg_key]['dynamics'] normalization_minimum = dynamics_model['attributes']['input_normalization_minimum'] normalization_maximum = dynamics_model['attributes']['input_normalization_maximum'] observation_names = dynamics_model['attributes']['input_observation_names'] periodic_observations = Building.get_periodic_observation_metadata() training_data = training_data.sort_values(['reference', 'timestep']) # type cast columns = [c for c in observation_names + list(periodic_observations.keys()) if not c.endswith('_sin') and not c.endswith('_cos')] training_data[columns] = training_data[columns].astype('float32') ## cyclic normalization for c, m in periodic_observations.items(): result = training_data[c]*PeriodicNormalization(x_max=m[-1]) result = pd.DataFrame(result.tolist(), index=result.index) training_data[f'{c}_sin'] = result[0].tolist() training_data[f'{c}_cos'] = result[1].tolist() input_columns = [] # then normalize all columns between 0 and 1 including the cyclic columns for i, c in enumerate(observation_names): input_columns.append(f'{c}_norm') training_data[input_columns[-1]] = training_data[c]*Normalize(normalization_minimum[i], normalization_maximum[i]) training_data[input_columns] = training_data[input_columns].astype('float32') independent_columns = input_columns[:-1] dependent_column = input_columns[-1] # initialize trained model model = LSTMDynamics( os.path.join(schema_directory, dynamics_model['attributes']['filename']), observation_names, normalization_minimum, normalization_maximum, hidden_size=dynamics_model['attributes']['hidden_size'], num_layers=dynamics_model['attributes']['num_layers'], lookback=dynamics_model['attributes']['lookback'] ) # make predictions data_list = [] for _, reference_data in training_data.groupby('reference'): reference_data = reference_data.reset_index(drop=True) model.reset() for i in range(model.lookback, reference_data.shape[0]): x_independent = reference_data[independent_columns].iloc[i - model.lookback + 1:i + 1].values x_dependent = reference_data[[dependent_column]].iloc[i - model.lookback:i].values x = np.append(x_independent, x_dependent, axis=1) x = torch.tensor(x.copy()) x = x[np.newaxis, :, :] hidden_state = tuple([h.data for h in model._hidden_state]) y, model._hidden_state = model(x.float(), hidden_state) y = y.item() reference_data.loc[i, dependent_column] = y predicted_column = dependent_column.replace('norm', 'predicted') actual_column = dependent_column.replace('_norm', '') norm_min = normalization_minimum[-1] norm_max = normalization_maximum[-1] reference_data[predicted_column] = reference_data[dependent_column]*(norm_max - norm_min) + norm_min reference_data = reference_data[['timestep', 'reference', 'reference_name', actual_column, predicted_column]].copy() data_list.append(reference_data) return bldg_ix, pd.concat(data_list, ignore_index=True)
[docs] def test_citylearn_simulation( self, schema: Path, model: Agent = None, env_kwargs: Mapping[str, Any] = None, model_kwargs: Mapping[str, Any] = None, report_lstm_performance: bool = None ) -> Tuple[pd.DataFrame, List[pd.DataFrame], List[pd.DataFrame]]: report_lstm_performance = True if report_lstm_performance is None else report_lstm_performance env_kwargs = {} if env_kwargs is None else env_kwargs model_kwargs = {} if model_kwargs is None else model_kwargs # test initialization env = CityLearnEnv(schema, **env_kwargs) model = BaselineAgent if model is None else model model = model(env=env, **model_kwargs) observations, _ = env.reset() # test stepping while not env.terminated: actions = model.predict(observations) observations, _, _, _, _ = env.step(actions) evaluation = env.evaluate() if report_lstm_performance: lstm_prediction_data: List[pd.DataFrame] = [] lstm_error_data: List[pd.DataFrame] = [] for b in env.buildings: lstm_prediction_data.append(pd.DataFrame({ 'hour': b.energy_simulation.hour, 'month': b.energy_simulation.month, 'indoor_dry_bulb_temperature': b.energy_simulation.indoor_dry_bulb_temperature_without_control, 'indoor_dry_bulb_temperature_predicted': b.indoor_dry_bulb_temperature, })) rmse_data = lstm_prediction_data[-1].groupby(['month'])[['indoor_dry_bulb_temperature','indoor_dry_bulb_temperature_predicted']].apply( lambda x: mean_squared_error(x['indoor_dry_bulb_temperature'], x['indoor_dry_bulb_temperature_predicted'] )).reset_index(name='rmse') rmse_data['rmse'] = rmse_data['rmse']**0.5 mape_data = lstm_prediction_data[-1].groupby(['month'])[['indoor_dry_bulb_temperature','indoor_dry_bulb_temperature_predicted']].apply( lambda x: mean_absolute_percentage_error(x['indoor_dry_bulb_temperature'], x['indoor_dry_bulb_temperature_predicted'] )).reset_index(name='mape') mape_data['mape'] = mape_data['mape']*100.0 error_data = rmse_data.merge(mape_data, on=['month']) error_data.insert(0, 'bldg_name', b.name) lstm_error_data.append(error_data) else: lstm_prediction_data = None lstm_error_data = None return evaluation, lstm_prediction_data, lstm_error_data
[docs] def set_schema( self, simulators: BuildingsSimulators, bldg_ids: List[int], lstm_models: List[Mapping[str, Any]] = None, pricing: Union[List[Union[Path, pd.DataFrame, str]], Path, pd.DataFrame, str] = None, carbon_intensity: List[Union[Path, pd.DataFrame, str]] = None, template: Mapping[str, Union[dict, float, int, str]] = None, metadata: pd.DataFrame = None, dataset_name: str = None, schema_directory: Union[Path, str] = None, weather_kwargs: dict = None, user_customization_function: Callable[[dict], dict] = None ) -> Path: assert pricing is None or not isinstance(pricing, list) or len(pricing) == len(bldg_ids), \ 'There must be as many pricing as bldg_ids.' assert carbon_intensity is None or not isinstance(carbon_intensity, list) or len(carbon_intensity) == len(bldg_ids), \ 'There must be as many carbon_intensity as bldg_ids.' template = get_settings()['schema']['template'] if template is None else template lstm_models = [None]*len(simulators) if lstm_models is None else lstm_models metadata = self.end_use_load_profiles.metadata.metadata.get().to_dict('index') if metadata is None else metadata schema_directory = self.dataset_directory if schema_directory is None else schema_directory county = metadata[list(metadata.keys())[0]][self.__COUNTY_COLUMN] county = county.lower().replace(',', '').replace(' ', '_') dataset_name = f'{self.end_use_load_profiles.version}-{county}' if dataset_name is None else dataset_name weather_kwargs = {} if weather_kwargs is None else weather_kwargs building_template = template.pop('buildings')['Building_1'] template['buildings'] = {} schema_directory = os.path.join(schema_directory, dataset_name) os.makedirs(schema_directory, exist_ok=True) # write weather (csv and epw) reference_simulator = simulators[0]['partial'][0] weather_data = self.get_weather_data(reference_simulator, **weather_kwargs) weather_filename = building_template['weather'] if building_template['weather'] is not None else 'weather.csv' weather_data.to_csv(os.path.join(schema_directory, weather_filename), index=False) _ = shutil.copy(reference_simulator.epw_filepath, os.path.join(schema_directory, weather_filename.replace('.csv', '.epw'))) for i, (bldg_id, building_simulators, lstm_model) in enumerate(zip(bldg_ids, simulators, lstm_models)): bldg_key = '-'.join(building_simulators['ideal'].simulation_id.split('-')[:-1]) simulator: EndUseLoadProfilesEnergyPlusPartialLoadSimulator = building_simulators['partial'][0] ideal_simulator: EndUseLoadProfilesEnergyPlusSimulator = building_simulators['ideal'] building = deepcopy(building_template) no_lstm_model = True if lstm_model is None else False # set building data building_data_query_filepath = os.path.join(simulator.QUERIES_DIRECTORY, 'select_citylearn_energy_simulation.sql') building_data = simulator.get_output_database().query_table_from_file(building_data_query_filepath) building_data_ideal = ideal_simulator.get_output_database().query_table_from_file(building_data_query_filepath) building_data['indoor_dry_bulb_temperature_cooling_set_point'] = building_data_ideal['indoor_dry_bulb_temperature_cooling_set_point'].tolist() building_data['indoor_dry_bulb_temperature_heating_set_point'] = building_data_ideal['indoor_dry_bulb_temperature_heating_set_point'].tolist() # set building-specific filepaths building['energy_simulation'] = f'{bldg_key}.csv' building['pricing'], building['carbon_intensity'] = self.__get_building_pricing_and_carbon_intensity( bldg_key, i, building_template, schema_directory, pricing, carbon_intensity) # as-modeled DER survey no_space_cooling = building_data['cooling_demand'].sum() == 0 no_space_heating = building_data['heating_demand'].sum() == 0 no_dhw_heating = building_data['dhw_demand'].sum() == 0 no_electric_dhw_heating = metadata[bldg_id]['in.water_heater_fuel'] != 'Electricity' no_dhw_heating_storage = True if no_electric_dhw_heating else False if no_space_cooling: building['cooling_device'] = None building['inactive_observations'] += [o for o in template['observations'] if 'cooling' in o] else: pass if no_space_heating: building['heating_device'] = None building['inactive_observations'] += [o for o in template['observations'] if 'heating' in o] else: pass if no_dhw_heating: building['dhw_device'] = None building['dhw_storage'] = None building['inactive_observations'] += [o for o in template['observations'] if 'dhw' in o] building['inactive_actions'] += ['dhw_storage'] elif no_dhw_heating_storage: building['dhw_storage'] = None building['inactive_observations'] += [o for o in template['observations'] if 'dhw_storage' in o] building['inactive_actions'] += ['dhw_storage'] else: pass # PV autosize attributes osm = OpenStudioModelEditor(self.end_use_load_profiles.get_building(bldg_id).open_studio_model.get()) building['pv']['autosize_attributes'] = { **building['pv']['autosize_attributes'], 'roof_area': round(osm.get_roof_area(), 2), } # dynamics model if no_lstm_model: building['dynamics'] = None building['type'] = 'citylearn.building.Building' else: building['dynamics']['attributes']['filename'] = f'{bldg_key}.pth' building['dynamics']['attributes']['hidden_size'] = lstm_model['attributes']['hidden_size'] building['dynamics']['attributes']['num_layers'] = lstm_model['attributes']['num_layers'] building['dynamics']['attributes']['lookback'] = lstm_model['attributes']['lookback'] building['dynamics']['attributes']['input_observation_names'] = lstm_model['attributes']['input_observation_names'] building['dynamics']['attributes']['input_normalization_minimum'] = lstm_model['attributes']['input_normalization_minimum'] building['dynamics']['attributes']['input_normalization_maximum'] = lstm_model['attributes']['input_normalization_maximum'] torch.save( lstm_model['model'].state_dict(), os.path.join(schema_directory, building['dynamics']['attributes']['filename']) ) # set building schema template['buildings'][bldg_key] = building # write back data file building_data = building_data.astype('float32') for c in ['hour', 'month', 'daylight_savings_status', 'hvac_mode', 'day_type']: if c in building_data.columns: building_data[c] = building_data[c].astype('int32') else: pass building_data.to_csv(os.path.join(schema_directory, building['energy_simulation']), index=False) schema_filepath = os.path.join(schema_directory, f'schema.json') template = user_customization_function(template) if user_customization_function is not None else template write_json(schema_filepath, template) return schema_filepath
def __get_building_pricing_and_carbon_intensity( self, bldg_key: str, bldg_ix: int, building_template: Mapping[str, Union[dict, float, int, str]], schema_directory: Union[str, Path], pricing: Union[List[Union[Path, pd.DataFrame, str]], Path, pd.DataFrame, str] = None, carbon_intensity: Union[List[Union[Path, pd.DataFrame, str]], Path, pd.DataFrame, str] = None ) -> Tuple[str, str]: data = dict( pricing=dict( default_filename=building_template['pricing'] if building_template['pricing'] is not None else 'pricing.csv', data=pricing, schema_filename=None ), carbon_intensity=dict( default_filename=building_template['carbon_intensity'] if building_template['carbon_intensity'] is not None else 'carbon_intensity.csv', data=carbon_intensity, schema_filename=None ) ) for k, v in data.items(): if v['data'] is None: if os.path.isfile(os.path.join(schema_directory, v['default_filename'])): data[k]['schema_filename'] = v['default_filename'] else: pass elif isinstance(v['data'], (Path, str)): destination_filepath = os.path.join(schema_directory, v['default_filename']) shutil.copy(v['data'], destination_filepath) data[k]['schema_filename'] = v['default_filename'] elif isinstance(v['data'], pd.DataFrame): destination_filepath = os.path.join(schema_directory, v['default_filename']) v['data'].to_csv(destination_filepath, index=False) data[k]['schema_filename'] = v['default_filename'] elif isinstance(v['data'], list): destination_filename = f'{bldg_key}-pricing.csv' data[k]['schema_filename'] = destination_filename destination_filepath = os.path.join(schema_directory, destination_filename) if isinstance(v['data'][bldg_ix], (Path, str)): shutil.copy(v['data'][bldg_ix], destination_filepath) elif isinstance(v['data'][bldg_ix], pd.DataFrame): v['data'][bldg_ix].to_csv(destination_filepath, index=False) else: raise ValueError(f'Invalid {k} value type: {type(v["data"])}') return data['pricing']['schema_filename'], data['carbon_intensity']['schema_filename']
[docs] def get_weather_data(self, simulator: EndUseLoadProfilesEnergyPlusPartialLoadSimulator, shifts: Tuple[int, int, int] = None, accuracy: Mapping[str, Tuple[float, float, float]] = None) -> pd.DataFrame: database = simulator.get_output_database() query_filepath = os.path.join(simulator.QUERIES_DIRECTORY, 'select_citylearn_weather.sql') data = database.query_table_from_file(query_filepath) columns = data.columns shifts = (6, 12, 24) if shifts is None else shifts accuracy = {c: (0.3, 0.65, 1.35) if c == 'outdoor_dry_bulb_temperature' else (0.025, 0.05, 0.1) for c in columns} \ if accuracy is None else accuracy for c in columns: for i, (s, a) in enumerate(zip(shifts, accuracy[c])): arr = np.roll(data[c], shift=-s) nprs = np.random.RandomState(self.random_seed) shift_column = f'{c}_predicted_{int(i + 1)}' if c in ['outdoor_dry_bulb_temperature']: data[shift_column] = arr + nprs.uniform(-a, a, len(arr)) elif c in ['outdoor_relative_humidity', 'diffuse_solar_irradiance', 'direct_solar_irradiance']: data[shift_column] = arr + arr*nprs.uniform(-a, a, len(arr)) else: raise Exception(f'Unknown field: {c}') if c != 'outdoor_dry_bulb_temperature': data[shift_column] = data[shift_column].clip(lower=0.0) if c == 'outdoor_relative_humidity': data[shift_column] = data[shift_column].clip(upper=100.0) else: pass else: pass data = data.astype('float32') return data
[docs] def train_lstm(self, data: List[pd.DataFrame], config: Mapping[str, Any] = None, seed: int = None) -> List[Mapping[str, Any]]: seed = self.random_seed if seed is None else seed config = get_settings()['lstm']['train']['config'] if config is None else config data = [run_one_model(config, d.copy(), seed) for d in data] return data
[docs] def get_lstm_training_data(self, simulators: BuildingsSimulators) -> List[pd.DataFrame]: data = [] for building_simulators in simulators: data_list = [] for partial_simulator in building_simulators['partial']: partial_simulator: EndUseLoadProfilesEnergyPlusPartialLoadSimulator query_filepath = os.path.join(EndUseLoadProfilesEnergyPlusPartialLoadSimulator.QUERIES_DIRECTORY, 'select_lstm_training_data.sql') pdata = partial_simulator.get_output_database().query_table_from_file(query_filepath) pdata.insert(0, 'reference_name', partial_simulator.simulation_id.split('-')[-2]) pdata.insert(0, 'reference', int(partial_simulator.simulation_id.split('-')[-1])) data_list.append(pdata) data.append(pd.concat(data_list, ignore_index=True)) return data
[docs] def simulate_energy_plus( self, bldg_ids: List[int], idd_filepath: Union[Path, str], simulation_ids: List[str] = None, models: List[Union[Path, str]] = None, schedules: List[Union[Path, pd.DataFrame]] = None, thermostat_setpoints: List[Union[Path, pd.DataFrame]] = None, fixed_ideal_loads_idf: List[Union[Path, str]] = None, osm: bool = None, partial_loads_simulations: int = None, simulate_mechanical: bool = None, delete_existing_simulation: bool = None, partial_loads_kwargs: Mapping[str, Any] = None, **kwargs ) -> BuildingsSimulators: assert models is None or len(models) == len(bldg_ids), 'There must be as many models as bldg_ids.' assert schedules is None or len(schedules) == len(bldg_ids), 'There must be as many schedules as bldg_ids.' assert thermostat_setpoints is None or len(thermostat_setpoints) == len(bldg_ids), 'There must be as many thermostat_setpoints as bldg_ids.' assert fixed_ideal_loads_idf is None or len(fixed_ideal_loads_idf) == len(bldg_ids), 'There must be as many fixed_ideal_loads_idf as bldg_ids.' assert simulation_ids is None or len(simulation_ids) == len(bldg_ids), 'There must be as many simulation_ids as bldg_ids.' os.makedirs(self.energyplus_output_directory, exist_ok=True) partial_loads_simulations = 4 if partial_loads_simulations is None else partial_loads_simulations simulate_mechanical = True if simulate_mechanical is None else simulate_mechanical delete_existing_simulation = True if delete_existing_simulation is None else delete_existing_simulation partial_loads_kwargs = {} if partial_loads_kwargs is None else partial_loads_kwargs simulators = [] kwargs = dict( idd_filepath=idd_filepath, osm=osm, **kwargs, number_of_time_steps_per_hour=1 if kwargs.get('number_of_time_steps_per_hour', None) is None else kwargs['number_of_time_steps_per_hour'] ) if ( kwargs.get('default_output_variables', None) is None or not kwargs['default_output_variables'] ) and kwargs.get('output_variables', None) is None: kwargs['default_output_variables'] = True else: pass if ( kwargs.get('default_output_meters', None) is None or not kwargs['default_output_meters'] ) and kwargs.get('output_meters', None) is None: kwargs['default_output_meters'] = True else: pass for i, bldg_id in enumerate(bldg_ids): bldg_id_ix = bldg_ids[:i].count(bldg_id) simulation_id = f'{self.end_use_load_profiles.version}-{bldg_id}-{bldg_id_ix}' if simulation_ids is None else simulation_ids[i] output_directory = os.path.join(self.energyplus_output_directory, simulation_id) if os.path.isdir(output_directory) and delete_existing_simulation: shutil.rmtree(output_directory) else: pass os.makedirs(output_directory) _kwargs = dict( **kwargs, bldg_id=bldg_id, model=models[i] if models is not None else models, schedules=schedules[i] if schedules is not None else schedules, thermostat_setpoint=thermostat_setpoints[i] if thermostat_setpoints is not None else thermostat_setpoints, ) # mechanical loads if simulate_mechanical: _simulation_id = f'{simulation_id}-mechanical' _output_directory = os.path.join(output_directory, _simulation_id) mechanical_simulator = self.end_use_load_profiles.simulate_building( ideal_loads=False, simulation_id=_simulation_id, output_directory=_output_directory, **_kwargs ).simulator else: mechanical_simulator = None # ideal loads _ideal_kwargs = deepcopy(_kwargs) if fixed_ideal_loads_idf is not None: _ideal_kwargs['model'] = fixed_ideal_loads_idf[i] _ideal_kwargs['osm'] = False else: pass _simulation_id = f'{simulation_id}-ideal' _output_directory = os.path.join(output_directory, _simulation_id) ideal_simulator = self.end_use_load_profiles.simulate_building( ideal_loads=True, simulation_id=_simulation_id, output_directory=_output_directory, **_ideal_kwargs ).simulator # partial loads partial_loads_simulators: List[EndUseLoadProfilesEnergyPlusPartialLoadSimulator] = [] kwargs_multiplier_minimum = partial_loads_kwargs.pop('multiplier_minimum', None) kwargs_multiplier_maximum = partial_loads_kwargs.pop('multiplier_maximum', None) kwargs_multiplier_probability = partial_loads_kwargs.pop('multiplier_probability', None) for i in range(partial_loads_simulations + 2): multiplier_minimum = kwargs_multiplier_minimum multiplier_maximum = kwargs_multiplier_maximum multiplier_probability = kwargs_multiplier_probability if i == 0: reference_name = 'ideal' multiplier_probability = 0 elif i == 1: reference_name = 'free_float' multiplier_minimum = 0 multiplier_maximum = 0 else: reference_name = 'undercool_overcool_underheat_overheat' _simulation_id = f'{simulation_id}-partial-{reference_name}-{i}' _output_directory = os.path.join(output_directory, _simulation_id) _ = partial_loads_kwargs.pop('simulation_id', None) _ = partial_loads_kwargs.pop('output_directory', None) _ = partial_loads_kwargs.pop('random_seed', None) partial_loads_simulators.append(EndUseLoadProfilesEnergyPlusPartialLoadSimulator( ideal_loads_simulator=deepcopy(ideal_simulator), multiplier_minimum=multiplier_minimum, multiplier_maximum=multiplier_maximum, multiplier_probability=multiplier_probability, simulation_id=_simulation_id, output_directory=_output_directory, random_seed=int(bldg_id) + i, **partial_loads_kwargs )) EndUseLoadProfilesEnergyPlusPartialLoadSimulator.multi_simulate(partial_loads_simulators, max_workers=self.max_workers) simulators.append({ 'mechanical': mechanical_simulator, 'ideal': ideal_simulator, 'partial': partial_loads_simulators }) return simulators
[docs] def sample_buildings( self, filters: Mapping[str, List[Any]] = None, sample_method: SampleMethod = None, sample_count: int = None, duplicate_to_count: bool = None, single_county: bool = None, single_family_detached: bool = None, **kwargs ) -> Tuple[List[int], List[int], Mapping[str, Any]]: sample_method = SampleMethod.RANDOM if sample_method is None else sample_method valid_sample_method = [v for v in SampleMethod] assert sample_method in valid_sample_method, f'Valid sample methods are {valid_sample_method}.' sample_count = 100 if sample_count is None else sample_count duplicate_to_count = True if duplicate_to_count is None else duplicate_to_count single_county = True if single_county is None else single_county single_family_detached = True if single_family_detached is None else single_family_detached nprs = np.random.RandomState(self.random_seed) sample_metadata = None if single_family_detached: filters = {} if filters is None else filters filters[self.__BUILDING_TYPE_COLUMN] = [self.__SINGLE_FAMILY_BUILDING_TYPE_NAME] else: pass metadata = self.end_use_load_profiles.metadata.metadata.get(filters) if single_county: county = nprs.choice(metadata[self.__COUNTY_COLUMN].unique(), 1)[0] metadata = metadata[metadata[self.__COUNTY_COLUMN]==county].copy() else: pass if sample_method == SampleMethod.RANDOM: metadata['label'] = 0 elif sample_method == SampleMethod.METADATA_CLUSTER_FREQUENCY: mc = MetadataClustering(self.end_use_load_profiles, metadata.index.tolist(), random_seed=self.random_seed, **kwargs) optimal_clusters, scores, labels = mc.cluster() sample_metadata = { 'optimal_clusters': optimal_clusters, 'scores': scores, 'labels': labels } metadata = metadata.merge(labels[labels['clusters']==optimal_clusters].set_index('bldg_id'), left_index=True, right_index=True) metadata['label_count'] = metadata.groupby('label')['label'].transform('count') metadata = metadata.sample(sample_count, weights='label_count', replace=duplicate_to_count, random_state=self.random_seed) bldg_ids = metadata.index.tolist() labels = metadata['label'].tolist() return bldg_ids, labels, sample_metadata