# dpop_small.toml
[pop]
node_features = 6
edge_features = 14
agent_neighbourhood_radius = 1
decentralized = false
epsilon_beta_scheduling = true

# RTE community detection works only with this enabled.
enable_power_supply_modularity = true

# Written as an integer: `1e5` parses as a TOML float (100000.0).
# NOTE(review): confirm the loader does not require a float here.
manager_history_size = 100_000

# 2 * substations
manager_initialization_half_life = 26

agent_type = "uniform"

# Same values as [manager] and [head_manager] in this file; only `embedding` differs.
[agent]
# String identifiers; presumably resolved to network definitions elsewhere —
# verify against the loader.
embedding = "egat_architecture_small"
advantage_stream = "advantage_stream_small"
value_stream = "value_stream_small"

learning_rate = 1e-2
learning_frequency = 4
target_network_weight_replace_steps = 500
gamma = 0.99
huber_loss_delta = 1.0
batch_size = 4

# NOTE(review): the unit of `epsilon_decay` (steps vs. episodes) is not visible here.
[agent.exploration]
method = "epsilon greedy"
max_epsilon = 1.0
min_epsilon = 0.01
epsilon_decay = 200

[agent.replay_memory]
alpha = 0.5
max_beta = 1.0
min_beta = 0.0
beta_decay = 200
capacity = 1000

# Same values as [agent] and [head_manager] in this file; only `embedding` differs.
[manager]
# String identifiers; presumably resolved to network definitions elsewhere —
# verify against the loader.
embedding = "egat_architecture_very_small"
advantage_stream = "advantage_stream_small"
value_stream = "value_stream_small"

learning_rate = 1e-2
learning_frequency = 4
target_network_weight_replace_steps = 500
gamma = 0.99
huber_loss_delta = 1.0
batch_size = 4

# NOTE(review): the unit of `epsilon_decay` (steps vs. episodes) is not visible here.
[manager.exploration]
method = "epsilon greedy"
max_epsilon = 1.0
min_epsilon = 0.01
epsilon_decay = 200

[manager.replay_memory]
alpha = 0.5
max_beta = 1.0
min_beta = 0.0
beta_decay = 200
capacity = 1000

# Same values as [agent] and [manager] in this file; only `embedding` differs.
[head_manager]
# String identifiers; presumably resolved to network definitions elsewhere —
# verify against the loader.
embedding = "gat_architecture_small"
advantage_stream = "advantage_stream_small"
value_stream = "value_stream_small"

learning_rate = 1e-2
learning_frequency = 4
target_network_weight_replace_steps = 500
gamma = 0.99
huber_loss_delta = 1.0
batch_size = 4

# NOTE(review): the unit of `epsilon_decay` (steps vs. episodes) is not visible here.
[head_manager.exploration]
method = "epsilon greedy"
max_epsilon = 1.0
min_epsilon = 0.01
epsilon_decay = 200

[head_manager.replay_memory]
alpha = 0.5
max_beta = 1.0
min_beta = 0.0
beta_decay = 200
capacity = 1000