forked from SymbioticLab/Fluid
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtune_hb_wlm.py
63 lines (47 loc) · 1.61 KB
/
tune_hb_wlm.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
from pathlib import Path
from ray import tune
from ray.tune.schedulers.hyperband import HyperBandScheduler
import workloads.common as com
from fluid.algo_random import VariantGenerator
from fluid.trainer import TorchTrainer
from workloads.common import wlm as workload
DATA_PATH, RESULTS_PATH = com.detect_paths()
EXP_NAME = com.remove_prefix(Path(__file__).stem, "tune_")
def setup_tune_scheduler(eta):
search_space = workload.create_search_space()
experiment_metrics = workload.exp_metric()
scheduler = HyperBandScheduler(
time_attr="training_iteration",
max_t=243,
reduction_factor=eta,
**experiment_metrics
)
return dict(
search_alg=VariantGenerator(),
scheduler=scheduler,
config=search_space,
resources_per_trial=com.detect_baseline_resource(),
)
def main():
eta, sd = com.init_ray()
eta = 3 if eta == 1 else eta
MyTrainable = TorchTrainer.as_trainable(
data_creator=workload.data_creator,
model_creator=workload.model_creator,
loss_creator=workload.loss_creator,
optimizer_creator=workload.optimizer_creator,
training_operator_cls=workload.WLMOperator,
config={"seed": sd, "extra_fluid_trial_resources": {}},
)
params = {
**com.run_options(__file__),
"stop": workload.create_stopper(),
**setup_tune_scheduler(eta),
}
analysis = tune.run(MyTrainable, **params)
dfs = analysis.trial_dataframes
for logdir, df in dfs.items():
ld = Path(logdir)
df.to_csv(ld / "trail_dataframe.csv")
if __name__ == "__main__":
main()