# rs2.yaml
---
# Sweep definition "rs2".
# NOTE(review): the top-level keys (method / metric / parameters / program /
# project) match the Weights & Biases sweep-configuration layout -- confirm
# against the tool that consumes this file.
#
# Every hyperparameter under `parameters` is pinned to one `value`; only
# `seed` lists several `values`, so the grid contains one entry per seed
# (8 in total).

method: grid

# Objective used to rank the runs of this sweep.
metric:
  goal: maximize
  name: eval_vs_GreedyBattleAgent/win_rate

name: rs2

parameters:
  act-fun:
    value: relu
  adversary:
    value: self-play
  cliprange:
    value: 0.2
  concurrency:
    value: 4
  draft-agent:
    value: inspirai
  ent-coef:
    value: 0.005
  eval-battle-agents:
    value: greedy
  eval-episodes:
    value: 250
  gamma:
    value: 0.99
  layers:
    value: 1
  learning-rate:
    value: 0.005838104376218821
  n-steps:
    value: 4096
  neurons:
    value: 501
  nminibatches-divider:
    value: 1
  noptepochs:
    value: 2
  num-evals:
    value: 100
  path:
    value: gym_locm/experiments/papers/entcom-2023/sweep/rs2
  reward-functions:
    value: coac
  reward-weights:
    value: 1
  role:
    value: alternate
  # The only swept parameter: one grid entry per listed seed.
  seed:
    values:
      - 73667418
      - 74896946
      - 28835729
      - 38458274
      - 68531181
      - 34553231
      - 8256697
      - 79863286
  switch-freq:
    value: 100
  task:
    value: battle
  train-episodes:
    value: 100000
  # Quoted so it stays the string "1.5" instead of being read as a float.
  version:
    value: "1.5"
  vf-coef:
    value: 1

program: gym_locm/experiments/training.py
project: entcom-2023