forked from EricSteinberger/DREAM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathFHP_DREAM.py
31 lines (25 loc) · 971 Bytes
/
FHP_DREAM.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
import numpy as np
from DREAM_and_DeepCFR.TrainingProfile import TrainingProfile
from DREAM_and_DeepCFR.workers.driver.Driver import Driver
from HYPERS import *
from PokerRL import Flop3Holdem
if __name__ == '__main__':
ctrl = Driver(t_prof=TrainingProfile(
name="FHP_DREAM_v001_SEED" + str(np.random.randint(1000000)),
n_traversals_per_iter=(SDCFR_FHP_TRAVERSALS_OS / N_LA_FHP_CFR),
sampler="learned_baseline",
os_eps=OS_EPS,
n_batches_per_iter_baseline=2000,
batch_size_baseline=int(2048 / N_LA_FHP_CFR),
game_cls=Flop3Holdem,
n_batches_adv_training=SDCFR_FHP_BATCHES,
n_learner_actor_workers=N_LA_FHP_CFR,
mini_batch_size_adv=int(SDCFR_FHP_BATCH_SIZE / N_LA_FHP_CFR),
max_buffer_size_adv=int(4e7 / N_LA_FHP_CFR),
DISTRIBUTED=True,
rlbr_args=DIST_RLBR_ARGS_games,
),
eval_methods={
"rlbr": RL_BR_FREQ_CFR
})
ctrl.run()