-
Notifications
You must be signed in to change notification settings - Fork 0
/
config_HAN.ini
80 lines (60 loc) · 1015 Bytes
/
config_HAN.ini
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
[MAIN]
; Task selector. NOTE(review): presumably one of hanoi, cartpole or gambler,
; matching the [HANOI], [CARTPOLE] and [GAMBLER] sections - confirm against
; the code that reads this file.
mode = hanoi
; NOTE(review): presumably switches a neural-network-based component on or
; off - confirm against the code that reads this flag.
NN = False
[HANOI]
; Parameters for the hanoi task (presumably used when mode = hanoi in [MAIN]).
; Number of pegs; allowed range [3 - 5].
pegs = 3
; Number of discs; allowed range [2 - 6].
discs = 4
[CARTPOLE]
; Parameters for the cartpole task (presumably used when mode = cartpole in
; [MAIN]). Units are not stated in this file.
; Pole length; allowed range [0.1 - 1].
pole_length = 0.5
; Pole mass; allowed range [0.05 - 0.5].
pole_mass = 0.1
; Gravity (negative value); allowed range [-15, -5].
gravity = -9.8
; Simulation timestep; allowed range [0.01, 0.1].
timestep = 0.02
[GAMBLER]
; Parameters for the gambler task (presumably used when mode = gambler in
; [MAIN]).
; Win probability; allowed range [0 - 1].
win_prob = 0.4
[GLOBALS]
; Settings that are not specific to one task section.
; All keys use the "key = value" form; do not mix in ":" or unspaced "=".

; Network input size and default activation function.
Input_neurons = 12
Activation_function = relu

; Training run settings.
batch_size = 8
optimizer = adam
episodes = 2200
time_steps = 300
verbose = False

; Learning parameters. Reference values per task:
;   TASK     ( Discount | Trace Decay | Epsilon )
;   HANOI    ( 1        | 0.5         | 1       )
;   CARTPOLE ( 0.5      | 0.7         | 0.5     )
;   GAMBLER  ( not yet determined )
critic_lr = 0.5
actor_lr = 0.5
discount = 1
trace_decay = 0.5
epsilon = 1

; Number of layers. NOTE(review): presumably must match the number of active
; [LAYERn] sections - confirm against the loader.
; Reference network shapes per task:
;   TASK     ( Layers | Neurons | Act             )
;   HANOI    ( 3      | 6       | relu -> sigmoid )
;   CARTPOLE ( 3      | 6       | relu -> sigmoid )
;   GAMBLER  ( not yet determined )
Layers = 2
[LAYER1]
; Layer 1: neuron count and activation function.
neurons = 10
act = relu
[LAYER2]
; Layer 2: neuron count and activation function.
neurons = 10
act = relu
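; Optional additional layers, currently disabled. To enable one, uncomment
; its three lines. NOTE(review): presumably Layers in [GLOBALS] must be raised
; to match - confirm against the loader.
;[LAYER3]
;neurons = 12
;act = relu
;[LAYER4]
;neurons = 15
;act = relu
;
;[LAYER5]
;neurons = 15
;act = relu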
[OUTPUT]
; Activation function for the output layer (presumably applied after the last
; active [LAYERn] section - confirm against the loader).
act = sigmoid