From 0a62778df91d62c80db5dc3bcf2af2a0f94c18e9 Mon Sep 17 00:00:00 2001 From: mastoffel Date: Wed, 2 Oct 2024 18:34:24 +0100 Subject: [PATCH 1/8] add separate dec enc hidden layers --- .../emulators/conditional_neural_process.py | 58 +++++++++---------- autoemulate/emulators/light_gbm.py | 4 +- .../emulators/neural_networks/cnp_module.py | 27 ++++++--- tests/models/test_cnp.py | 8 +-- 4 files changed, 55 insertions(+), 42 deletions(-) diff --git a/autoemulate/emulators/conditional_neural_process.py b/autoemulate/emulators/conditional_neural_process.py index 14b54d76..be21877f 100644 --- a/autoemulate/emulators/conditional_neural_process.py +++ b/autoemulate/emulators/conditional_neural_process.py @@ -42,8 +42,10 @@ class ConditionalNeuralProcess(RegressorMixin, BaseEstimator): The number of hidden units in the neural network layers. latent_dim : int, default=64 The dimensionality of the latent space. - hidden_layers : int, default=3 - The number of hidden layers in the neural network. + hidden_layers_enc : int, default=3 + The number of hidden layers in the encoder. + hidden_layers_dec : int, default=3 + The number of hidden layers in the decoder. min_context_points : int, default=3 The minimum number of context points to use during training. 
max_context_points : int, default=10 @@ -108,14 +110,15 @@ def __init__( # architecture hidden_dim=64, latent_dim=64, - hidden_layers=3, + hidden_layers_enc=3, + hidden_layers_dec=3, # data per episode min_context_points=3, max_context_points=10, n_episode=32, # training max_epochs=100, - lr=1e-2, + lr=5e-2, batch_size=16, activation=nn.ReLU, optimizer=torch.optim.AdamW, @@ -127,7 +130,8 @@ def __init__( ): self.hidden_dim = hidden_dim self.latent_dim = latent_dim - self.hidden_layers = hidden_layers + self.hidden_layers_enc = hidden_layers_enc + self.hidden_layers_dec = hidden_layers_dec self.min_context_points = min_context_points self.max_context_points = max_context_points self.n_episode = n_episode @@ -184,7 +188,8 @@ def fit(self, X, y): module__output_dim=self.output_dim_, module__hidden_dim=self.hidden_dim, module__latent_dim=self.latent_dim, - module__hidden_layers=self.hidden_layers, + module__hidden_layers_enc=self.hidden_layers_enc, + module__hidden_layers_dec=self.hidden_layers_dec, module__activation=self.activation, dataset__min_context_points=self.min_context_points, dataset__max_context_points=self.max_context_points, @@ -193,11 +198,7 @@ def fit(self, X, y): lr=self.lr, batch_size=self.batch_size, optimizer=self.optimizer, - device=self.device - if self.device is not None - else "cuda" - if torch.cuda.is_available() - else "cpu", + device=self.device, dataset=CNPDataset, # special dataset to sample context and target sets criterion=CNPLoss, iterator_train__collate_fn=cnp_collate_fn, # special collate to different n in episodes @@ -260,31 +261,30 @@ def predict(self, X, return_std=False): def get_grid_params(search_type: str = "random"): param_space = { "max_epochs": [100, 200, 300], - "batch_size": [16, 32, 64], + "batch_size": [16, 32], "hidden_dim": [32, 64, 128], "latent_dim": [32, 64, 128], - "max_context_points": [10, 20, 30], - "hidden_layers": [1, 2, 3, 4, 5], + "max_context_points": [5, 10, 15], + "hidden_layers_enc": [2, 3, 4], + 
"hidden_layers_dec": [2, 3, 4], "activation": [ nn.ReLU, - # nn.Tanh, nn.GELU, - # nn.Sigmoid, ], - # ], - "optimizer": [torch.optim.AdamW, torch.optim.SGD], # + "optimizer": [torch.optim.AdamW], # + "lr": loguniform(1e-3, 2e-1), } - # match search_type: - # case "random": - # param_space |= { - # "lr": loguniform(1e-4, 1e-2), - # } - # case "bayes": - # param_space |= { - # "lr": Real(1e-4, 1e-2, prior="log-uniform"), - # } - # case _: - # raise ValueError(f"Invalid search type: {search_type}") + # # match search_type: + # case "random": + # param_space |= { + # "lr": loguniform(1e-4, 1e-2), + # } + # case "bayes": + # param_space |= { + # "lr": Real(1e-4, 1e-2, prior="log-uniform"), + # } + # case _: + # raise ValueError(f"Invalid search type: {search_type}") return param_space diff --git a/autoemulate/emulators/light_gbm.py b/autoemulate/emulators/light_gbm.py index 2d9df8e9..05851f79 100644 --- a/autoemulate/emulators/light_gbm.py +++ b/autoemulate/emulators/light_gbm.py @@ -108,7 +108,7 @@ def predict(self, X): def get_grid_params(self, search_type="random"): """Returns the grid parameters of the emulator.""" param_space_random = { - "boosting_type": ["gbdt", "dart"], + "boosting_type": ["gbdt"], "num_leaves": randint(10, 100), "max_depth": randint(-1, 12), "learning_rate": loguniform(0.001, 0.1), @@ -119,7 +119,7 @@ def get_grid_params(self, search_type="random"): } param_space_bayes = { - "boosting_type": Categorical(["gbdt", "dart"]), + "boosting_type": Categorical(["gbdt"]), "num_leaves": Integer(10, 100), "max_depth": Integer(-1, 12), "learning_rate": Real(0.001, 0.1, prior="log-uniform"), diff --git a/autoemulate/emulators/neural_networks/cnp_module.py b/autoemulate/emulators/neural_networks/cnp_module.py index db846ca5..712135cf 100644 --- a/autoemulate/emulators/neural_networks/cnp_module.py +++ b/autoemulate/emulators/neural_networks/cnp_module.py @@ -13,11 +13,17 @@ class Encoder(nn.Module): """ def __init__( - self, input_dim, output_dim, 
hidden_dim, latent_dim, hidden_layers, activation + self, + input_dim, + output_dim, + hidden_dim, + latent_dim, + hidden_layers_enc, + activation, ): super().__init__() layers = [nn.Linear(input_dim + output_dim, hidden_dim), activation()] - for _ in range(hidden_layers): + for _ in range(hidden_layers_enc): layers.extend([nn.Linear(hidden_dim, hidden_dim), activation()]) layers.append(nn.Linear(hidden_dim, latent_dim)) self.net = nn.Sequential(*layers) @@ -53,11 +59,17 @@ def forward(self, x_context, y_context, context_mask=None): class Decoder(nn.Module): def __init__( - self, input_dim, latent_dim, hidden_dim, output_dim, hidden_layers, activation + self, + input_dim, + latent_dim, + hidden_dim, + output_dim, + hidden_layers_dec, + activation, ): super().__init__() layers = [nn.Linear(latent_dim + input_dim, hidden_dim), activation()] - for _ in range(hidden_layers): + for _ in range(hidden_layers_dec): layers.extend([nn.Linear(hidden_dim, hidden_dim), activation()]) self.net = nn.Sequential(*layers) self.mean_head = nn.Linear(hidden_dim, output_dim) @@ -94,15 +106,16 @@ def __init__( output_dim, hidden_dim, latent_dim, - hidden_layers, + hidden_layers_enc, + hidden_layers_dec, activation=nn.ReLU, ): super().__init__() self.encoder = Encoder( - input_dim, output_dim, hidden_dim, latent_dim, hidden_layers, activation + input_dim, output_dim, hidden_dim, latent_dim, hidden_layers_enc, activation ) self.decoder = Decoder( - input_dim, latent_dim, hidden_dim, output_dim, hidden_layers, activation + input_dim, latent_dim, hidden_dim, output_dim, hidden_layers_dec, activation ) def forward(self, X_context, y_context, X_target=None, context_mask=None): diff --git a/tests/models/test_cnp.py b/tests/models/test_cnp.py index 682f89d5..e4e46f2f 100644 --- a/tests/models/test_cnp.py +++ b/tests/models/test_cnp.py @@ -16,10 +16,10 @@ def encoder(): output_dim = 2 hidden_dim = 64 latent_dim = 32 - hidden_layers = 3 + hidden_layers_enc = 3 activation = nn.ReLU return Encoder( 
- input_dim, output_dim, hidden_dim, latent_dim, hidden_layers, activation + input_dim, output_dim, hidden_dim, latent_dim, hidden_layers_enc, activation ) @@ -96,10 +96,10 @@ def decoder(): latent_dim = 64 hidden_dim = 128 output_dim = 1 - hidden_layers = 3 + hidden_layers_dec = 5 activation = nn.ReLU return Decoder( - input_dim, latent_dim, hidden_dim, output_dim, hidden_layers, activation + input_dim, latent_dim, hidden_dim, output_dim, hidden_layers_dec, activation ) From b64d6cadfddc4ad80225467d00de08b9740b510a Mon Sep 17 00:00:00 2001 From: mastoffel Date: Wed, 9 Oct 2024 14:01:52 +0100 Subject: [PATCH 2/8] optimise cnp --- autoemulate/emulators/conditional_neural_process.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/autoemulate/emulators/conditional_neural_process.py b/autoemulate/emulators/conditional_neural_process.py index be21877f..29b15751 100644 --- a/autoemulate/emulators/conditional_neural_process.py +++ b/autoemulate/emulators/conditional_neural_process.py @@ -118,13 +118,13 @@ def __init__( n_episode=32, # training max_epochs=100, - lr=5e-2, + lr=5e-3, batch_size=16, activation=nn.ReLU, optimizer=torch.optim.AdamW, normalize_y=True, # misc - device=None, + device="cpu", random_state=None, attention=False, ): @@ -272,7 +272,7 @@ def get_grid_params(search_type: str = "random"): nn.GELU, ], "optimizer": [torch.optim.AdamW], # - "lr": loguniform(1e-3, 2e-1), + "lr": loguniform(5e-4, 1e-2), } # # match search_type: # case "random": From 583f9fb54160229dffa6587f2a45583eb1bea924 Mon Sep 17 00:00:00 2001 From: mastoffel Date: Wed, 9 Oct 2024 14:38:09 +0100 Subject: [PATCH 3/8] remove some param search options from svm --- autoemulate/emulators/support_vector_machines.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/autoemulate/emulators/support_vector_machines.py b/autoemulate/emulators/support_vector_machines.py index d0b0fbcb..65f98e68 100644 --- a/autoemulate/emulators/support_vector_machines.py +++ 
b/autoemulate/emulators/support_vector_machines.py @@ -134,8 +134,6 @@ def get_grid_params(self, search_type="random"): "C": uniform(1.0, 3.0), "epsilon": uniform(0.1, 0.3), "shrinking": [True, False], - "cache_size": randint(200, 401), - "verbose": [False], "max_iter": [-1], } From 934ec4bd2045dfa16a3362df3154692c8b7d593d Mon Sep 17 00:00:00 2001 From: mastoffel Date: Thu, 10 Oct 2024 10:12:47 +0100 Subject: [PATCH 4/8] tweak rf --- autoemulate/emulators/random_forest.py | 32 ++++---------------------- 1 file changed, 4 insertions(+), 28 deletions(-) diff --git a/autoemulate/emulators/random_forest.py b/autoemulate/emulators/random_forest.py index 6173f2e2..ca505133 100644 --- a/autoemulate/emulators/random_forest.py +++ b/autoemulate/emulators/random_forest.py @@ -100,18 +100,18 @@ def get_grid_params(self, search_type="random"): "n_estimators": randint(50, 500), "min_samples_split": randint(2, 20), "min_samples_leaf": randint(1, 10), - "max_features": [None, "sqrt", "log2"], + "max_features": ["sqrt", "log2", None, 1.0], "bootstrap": [True, False], "oob_score": [True, False], - # # "max_depth": [None] + list(range(3, 20)), # None plus a range of depths - "max_samples": [None, 0.5, 0.75], + "max_depth": [None] + list(range(5, 30, 5)), # None plus a range of depths + "max_samples": [None, 0.5, 0.7, 0.9], } param_space_bayes = { "n_estimators": Integer(50, 500), "min_samples_split": Integer(2, 20), "min_samples_leaf": Integer(1, 10), - "max_features": Categorical([None, "sqrt", "log2"]), + "max_features": ["sqrt", "log2", 1.0, None], "bootstrap": Categorical([True, False]), "oob_score": Categorical([True, False]), # "max_depth": Categorical([None] + list(range(3, 20))), # None plus a range of depths @@ -131,27 +131,3 @@ def model_name(self): def _more_tags(self): return {"multioutput": True} - - # def score(self, X, y, metric): - # """Returns the score of the emulator. 
- - # Parameters - # ---------- - # X : array-like, shape (n_samples, n_features) - # Simulation input. - # y : array-like, shape (n_samples, n_outputs) - # Simulation output. - # metric : str - # Name of the metric to use, currently either rsme or r2. - # Returns - # ------- - # metric : float - # Metric of the emulator. - - # """ - # predictions = self.predict(X) - # return metric(y, predictions) - - # def _more_tags(self): - # return {'non_deterministic': True, - # 'multioutput': True} From 70b974bac8d6b6dd943d7b3aa0dff422c74303ca Mon Sep 17 00:00:00 2001 From: mastoffel Date: Thu, 10 Oct 2024 10:24:57 +0100 Subject: [PATCH 5/8] tweak gb --- autoemulate/emulators/gradient_boosting.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/autoemulate/emulators/gradient_boosting.py b/autoemulate/emulators/gradient_boosting.py index 5f67b754..e6f21295 100644 --- a/autoemulate/emulators/gradient_boosting.py +++ b/autoemulate/emulators/gradient_boosting.py @@ -109,7 +109,7 @@ def get_grid_params(self, search_type="random"): "min_samples_leaf": randint(1, 6), "subsample": uniform(0.6, 0.4), # 0.4 is the range width (1.0 - 0.6) "max_features": ["sqrt", "log2", None], - "ccp_alpha": loguniform(0.01, 0.1), + "ccp_alpha": loguniform(0.001, 0.1), } param_space_bayes = { From 144b818bfdc77eda272199c1e56d4623b6169880 Mon Sep 17 00:00:00 2001 From: mastoffel Date: Thu, 10 Oct 2024 11:18:38 +0100 Subject: [PATCH 6/8] cleanup rbf --- autoemulate/emulators/radial_basis_functions.py | 7 +------ 1 file changed, 1 insertion(+), 6 deletions(-) diff --git a/autoemulate/emulators/radial_basis_functions.py b/autoemulate/emulators/radial_basis_functions.py index 11fcbdd5..19a419d1 100644 --- a/autoemulate/emulators/radial_basis_functions.py +++ b/autoemulate/emulators/radial_basis_functions.py @@ -85,12 +85,7 @@ def predict(self, X): def get_grid_params(self, search_type="random"): """Returns the grid parameters of the emulator.""" - # param_space_random = { - # #"smoothing": 
uniform(0.0, 1.0), - # "kernel": ["linear", "thin_plate_spline", "cubic", "quintic", "multiquadric", "inverse_multiquadric", "gaussian"], - # #"epsilon": uniform(0.0, 1.0), - # "degree": randint(0, 5), - # } + param_space_random = [ { "kernel": ["linear", "multiquadric"], From 8abfcf93477a7783bed99ddf164bc812ab254d3c Mon Sep 17 00:00:00 2001 From: mastoffel Date: Thu, 10 Oct 2024 12:02:18 +0100 Subject: [PATCH 7/8] tweak device param --- autoemulate/emulators/gaussian_process_torch.py | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/autoemulate/emulators/gaussian_process_torch.py b/autoemulate/emulators/gaussian_process_torch.py index 3f5db025..92ef18b4 100644 --- a/autoemulate/emulators/gaussian_process_torch.py +++ b/autoemulate/emulators/gaussian_process_torch.py @@ -59,7 +59,7 @@ def __init__( max_epochs=50, normalize_y=True, # misc - device=None, + device="cpu", random_state=None, ): self.mean_module = mean_module @@ -167,11 +167,7 @@ def fit(self, X, y): ), ], verbose=0, - device=self.device - if self.device is not None - else "cuda" - if torch.cuda.is_available() - else "cpu", + device=self.device, ) self.model_.fit(X, y) self.is_fitted_ = True From b68c497b33b1c8fbbe9d70ff28ef0108e0e17436 Mon Sep 17 00:00:00 2001 From: mastoffel Date: Thu, 10 Oct 2024 13:26:36 +0100 Subject: [PATCH 8/8] remove unused imports --- autoemulate/compare.py | 8 -------- autoemulate/cross_validate.py | 2 -- .../emulators/conditional_neural_process.py | 1 - .../emulators/gaussian_process_sklearn.py | 1 - autoemulate/emulators/gaussian_process_torch.py | 17 ----------------- autoemulate/emulators/polynomials.py | 1 - autoemulate/emulators/random_forest.py | 1 - autoemulate/logging_config.py | 1 - autoemulate/model_processing.py | 3 --- autoemulate/plotting.py | 2 -- autoemulate/save.py | 4 ---- tests/models/test_cnp.py | 3 ++- 12 files changed, 2 insertions(+), 42 deletions(-) diff --git a/autoemulate/compare.py b/autoemulate/compare.py index 
4c70b7f7..dee40c3e 100644 --- a/autoemulate/compare.py +++ b/autoemulate/compare.py @@ -1,16 +1,9 @@ -import matplotlib.pyplot as plt import numpy as np import pandas as pd from sklearn.base import BaseEstimator from sklearn.decomposition import PCA -from sklearn.metrics import make_scorer -from sklearn.model_selection import cross_validate from sklearn.model_selection import KFold -from sklearn.model_selection import PredefinedSplit -from sklearn.model_selection import train_test_split -from sklearn.pipeline import Pipeline from sklearn.preprocessing import StandardScaler -from sklearn.utils.validation import check_is_fitted from sklearn.utils.validation import check_X_y from tqdm.autonotebook import tqdm @@ -27,7 +20,6 @@ from autoemulate.plotting import _plot_model from autoemulate.printing import _print_setup from autoemulate.save import ModelSerialiser -from autoemulate.utils import _ensure_2d from autoemulate.utils import _get_full_model_name from autoemulate.utils import _redirect_warnings from autoemulate.utils import get_model_name diff --git a/autoemulate/cross_validate.py b/autoemulate/cross_validate.py index 50e45d27..9924cbd0 100644 --- a/autoemulate/cross_validate.py +++ b/autoemulate/cross_validate.py @@ -5,8 +5,6 @@ import pandas as pd from sklearn.metrics import make_scorer from sklearn.model_selection import cross_validate -from sklearn.model_selection import PredefinedSplit -from sklearn.model_selection import train_test_split from autoemulate.utils import get_model_name from autoemulate.utils import get_model_params diff --git a/autoemulate/emulators/conditional_neural_process.py b/autoemulate/emulators/conditional_neural_process.py index 29b15751..2f7d72d8 100644 --- a/autoemulate/emulators/conditional_neural_process.py +++ b/autoemulate/emulators/conditional_neural_process.py @@ -9,7 +9,6 @@ from sklearn.utils.validation import check_array from sklearn.utils.validation import check_is_fitted from sklearn.utils.validation import check_X_y -from 
skopt.space import Real from skorch import NeuralNetRegressor from skorch.callbacks import EarlyStopping from skorch.callbacks import GradientNormClipping diff --git a/autoemulate/emulators/gaussian_process_sklearn.py b/autoemulate/emulators/gaussian_process_sklearn.py index 41dbfe33..f4c1bd49 100644 --- a/autoemulate/emulators/gaussian_process_sklearn.py +++ b/autoemulate/emulators/gaussian_process_sklearn.py @@ -10,7 +10,6 @@ from sklearn.utils.validation import check_is_fitted from sklearn.utils.validation import check_X_y from skopt.space import Categorical -from skopt.space import Integer from skopt.space import Real from autoemulate.utils import _suppress_convergence_warnings diff --git a/autoemulate/emulators/gaussian_process_torch.py b/autoemulate/emulators/gaussian_process_torch.py index 92ef18b4..f9011fe3 100644 --- a/autoemulate/emulators/gaussian_process_torch.py +++ b/autoemulate/emulators/gaussian_process_torch.py @@ -1,30 +1,13 @@ -from copy import deepcopy - import gpytorch import numpy as np import torch -from scipy.stats import loguniform -from scipy.stats import randint from sklearn.base import BaseEstimator from sklearn.base import RegressorMixin -from sklearn.exceptions import DataConversionWarning -from sklearn.metrics import r2_score -from sklearn.model_selection import train_test_split from sklearn.preprocessing._data import _handle_zeros_in_scale from sklearn.utils import check_array from sklearn.utils import check_X_y from sklearn.utils.validation import check_is_fitted -from skopt.space import Categorical -from skopt.space import Integer -from skopt.space import Real -from skorch.callbacks import Checkpoint -from skorch.callbacks import EarlyStopping -from skorch.callbacks import EpochScoring from skorch.callbacks import LRScheduler -from skorch.callbacks import ProgressBar -from skorch.dataset import Dataset -from skorch.dataset import ValidSplit -from skorch.helper import predefined_split from skorch.probabilistic import 
ExactGPRegressor from autoemulate.emulators.gaussian_process_utils import EarlyStoppingCustom diff --git a/autoemulate/emulators/polynomials.py b/autoemulate/emulators/polynomials.py index f626019e..7c54e1bc 100644 --- a/autoemulate/emulators/polynomials.py +++ b/autoemulate/emulators/polynomials.py @@ -8,7 +8,6 @@ from sklearn.utils.validation import check_is_fitted from sklearn.utils.validation import check_X_y from skopt.space import Categorical -from skopt.space import Integer class SecondOrderPolynomial(BaseEstimator, RegressorMixin): diff --git a/autoemulate/emulators/random_forest.py b/autoemulate/emulators/random_forest.py index ca505133..bd85c0cc 100644 --- a/autoemulate/emulators/random_forest.py +++ b/autoemulate/emulators/random_forest.py @@ -7,7 +7,6 @@ from sklearn.utils.validation import check_X_y from skopt.space import Categorical from skopt.space import Integer -from skopt.space import Real class RandomForest(BaseEstimator, RegressorMixin): diff --git a/autoemulate/logging_config.py b/autoemulate/logging_config.py index 62a863dc..0e9f13ff 100644 --- a/autoemulate/logging_config.py +++ b/autoemulate/logging_config.py @@ -1,7 +1,6 @@ import logging import os import sys -import warnings from pathlib import Path diff --git a/autoemulate/model_processing.py b/autoemulate/model_processing.py index 54d54685..65da5850 100644 --- a/autoemulate/model_processing.py +++ b/autoemulate/model_processing.py @@ -2,9 +2,6 @@ from sklearn.multioutput import MultiOutputRegressor from sklearn.pipeline import Pipeline -from autoemulate.utils import get_model_name -from autoemulate.utils import get_short_model_name - def _turn_models_into_multioutput(models, y): """Turn single output models into multioutput models if y is 2D. 
diff --git a/autoemulate/plotting.py b/autoemulate/plotting.py index aba5c0d8..76b85678 100644 --- a/autoemulate/plotting.py +++ b/autoemulate/plotting.py @@ -1,5 +1,4 @@ import inspect -import time import matplotlib.pyplot as plt import numpy as np @@ -7,7 +6,6 @@ from sklearn.pipeline import Pipeline from autoemulate.utils import _ensure_2d -from autoemulate.utils import get_model_name def _validate_inputs(cv_results, model_name): diff --git a/autoemulate/save.py b/autoemulate/save.py index 0c491e4a..35abf1b6 100644 --- a/autoemulate/save.py +++ b/autoemulate/save.py @@ -1,10 +1,6 @@ -import json -import os from pathlib import Path import joblib -import numpy as np -import sklearn from autoemulate.utils import get_model_name diff --git a/tests/models/test_cnp.py b/tests/models/test_cnp.py index e4e46f2f..f650ae36 100644 --- a/tests/models/test_cnp.py +++ b/tests/models/test_cnp.py @@ -150,7 +150,8 @@ def cnp_module(): output_dim=1, hidden_dim=32, latent_dim=64, - hidden_layers=2, + hidden_layers_enc=2, + hidden_layers_dec=2, activation=nn.ReLU, )