9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115 | def cv_model(config: dict, fun_control: dict) -> float:
"""
Performs k-fold cross-validation on a model using the given configuration and function control parameters.
Args:
config (dict): A dictionary containing the configuration parameters for the model.
fun_control (dict): A dictionary containing the function control parameters.
Returns:
(float): The mean average precision at k (MAP@k) score of the model.
Examples:
>>> config = {
... "initialization": "Xavier",
... "batch_size": 32,
... "patience": 10,
... }
>>> fun_control = {
... "_L_in": 10,
... "_L_out": 1,
... "_L_cond": 0,
... "enable_progress_bar": True,
... "core_model": MyModel,
... "num_workers": 4,
... "DATASET_PATH": "./data",
... "CHECKPOINT_PATH": "./checkpoints",
... "TENSORBOARD_PATH": "./tensorboard",
... "k_folds": 5,
... }
>>> mapk_score = cv_model(config, fun_control)
"""
_L_in = fun_control["_L_in"]
_L_out = fun_control["_L_out"]
_L_cond = fun_control["_L_cond"]
_torchmetric = fun_control["_torchmetric"]
if fun_control["enable_progress_bar"] is None:
enable_progress_bar = False
else:
enable_progress_bar = fun_control["enable_progress_bar"]
# Add "CV" postfix to config_id
config_id = generate_config_id(config, timestamp=True) + "_CV"
results = []
num_folds = fun_control["k_folds"]
split_seed = 12345
for k in range(num_folds):
print("k:", k)
model = fun_control["core_model"](**config, _L_in=_L_in, _L_out=_L_out, _L_cond=_L_cond, _torchmetric=_torchmetric)
if fun_control["data_module"] is None:
dm = LightCrossValidationDataModule(
k=k,
num_splits=num_folds,
split_seed=split_seed,
dataset=fun_control["data_set"],
data_full_train=fun_control["data_full_train"],
data_test=fun_control["data_test"],
data_val=fun_control["data_val"],
num_workers=fun_control["num_workers"],
batch_size=config["batch_size"],
data_dir=fun_control["DATASET_PATH"],
scaler=fun_control["scaler"],
verbosity=fun_control["verbosity"],
)
else:
dm = fun_control["data_module"]
dm.setup()
dm.prepare_data()
# TODO: Check if this is necessary:
# dm.setup()
# Init trainer
trainer = L.Trainer(
# Where to save models
default_root_dir=os.path.join(fun_control["CHECKPOINT_PATH"], config_id),
max_epochs=model.hparams.epochs,
accelerator=fun_control["accelerator"],
devices=fun_control["devices"],
strategy=fun_control["strategy"],
num_nodes=fun_control["num_nodes"],
precision=fun_control["precision"],
logger=TensorBoardLogger(
save_dir=fun_control["TENSORBOARD_PATH"],
version=config_id,
default_hp_metric=True,
log_graph=fun_control["log_graph"],
),
callbacks=[EarlyStopping(monitor="val_loss", patience=config["patience"], mode="min", strict=False, verbose=False)],
enable_progress_bar=enable_progress_bar,
)
# Pass the datamodule as arg to trainer.fit to override model hooks :)
trainer.fit(model=model, datamodule=dm)
# Test best model on validation and test set
# result = trainer.validate(model=model, datamodule=dm, ckpt_path="last")
verbose = fun_control["verbosity"] > 0
score = trainer.validate(model=model, datamodule=dm, verbose=verbose)
# unlist the result (from a list of one dict)
score = score[0]
print(f"train_model result: {score}")
results.append(score["val_loss"])
score = sum(results) / num_folds
# print(f"cv_model mapk result: {mapk_score}")
return score
|