-
Notifications
You must be signed in to change notification settings - Fork 236
/
utils.py
53 lines (41 loc) · 1.62 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
import numpy as np
from enum import Enum
class ScoreMode(Enum):
    """Different ways we might consider scoring our runs.

    This is for BO's sake, not for our RL agent - ie it helps us decide which
    hyper combos to pursue.
    """
    MEAN = 1  # mean of all episodes
    LAST = 2  # final episode (the one w/o killing)
    POS = 3  # number of positive (> 0) episodes
    CONSECUTIVE_POS = 4  # longest streak of *consecutive* positive episodes
    TOTAL = 5  # sum of all episodes
    MIX = 6  # mean of every episode but the last, plus the last episode


# Scoring strategy calculate_score() uses when no explicit mode is passed.
MODE = ScoreMode.MEAN


def calculate_score(scores, mode=None):
    """Collapse per-episode scores into one number according to a ScoreMode.

    Args:
        scores: Mutable, indexable sequence of numeric scores (e.g. a list).
            NOTE: it is modified in place - every entry equal to 0 is
            overwritten with -1 before scoring. The side effect is kept
            because existing callers may rely on it.
        mode: ScoreMode to apply. Defaults to the module-level MODE.

    Returns:
        The score for the selected mode, or None when ``mode`` is not one of
        the ScoreMode members handled below.
    """
    if mode is None:
        mode = MODE

    # Exact zeros are scored as -1; the replacement is written back into
    # `scores` itself.
    for i, value in enumerate(scores):
        if value == 0.:
            scores[i] = -1.

    if mode == ScoreMode.MEAN:
        return np.mean(scores)
    if mode == ScoreMode.LAST:
        return scores[-1]
    if mode == ScoreMode.MIX:
        return np.mean(scores[:-1]) + scores[-1]
    if mode == ScoreMode.POS:
        return sum(1 for value in scores if value > 0)
    if mode == ScoreMode.TOTAL:
        return sum(scores)
    if mode == ScoreMode.CONSECUTIVE_POS:
        longest = current = 0
        for value in scores:
            if value > 0:
                current += 1
                # Update on every positive so a streak that runs through the
                # final episode is counted (previously it was dropped).
                longest = max(longest, current)
            else:
                current = 0
        return longest
    return None
def add_common_args(parser):
    """Register the command-line options shared across scripts on `parser`.

    Adds `-g/--gpu-split` (float, default 1) and the boolean flag
    `--autoencode`. The parser is modified in place; nothing is returned.
    """
    register = parser.add_argument
    register(
        '-g', '--gpu-split',
        type=float,
        default=1,
        help="Num ways we'll split the GPU (how many tabs you running?)",
    )
    register(
        '--autoencode',
        action="store_true",
        help="If you're running out of GPU memory, try --autoencode which scales things down",
    )
# Commit hash interpolated into the error raised by raise_refactor().
last_good_commit = '6a6e49c'


def raise_refactor():
    """Abort with a pointer to the commit to restore from.

    Raises:
        NotImplementedError: always; the message names `last_good_commit`.
    """
    # `NotImplemented` is a non-callable singleton meant for binary-operator
    # fallbacks; calling it raised TypeError. NotImplementedError is the
    # exception class intended here.
    raise NotImplementedError(f'Restore from {last_good_commit}')