-
Notifications
You must be signed in to change notification settings - Fork 16
/
FHP_NFSP.py
32 lines (27 loc) · 991 Bytes
/
FHP_NFSP.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
import numpy as np
from HYPERS import *
from NFSP.TrainingProfile import TrainingProfile
from NFSP.workers.driver.Driver import Driver
from PokerRL import Flop3Holdem
if __name__ == "__main__":
    # Launch script: build one TrainingProfile, hand it to a Driver, and run.

    # Tag the run name with a random integer drawn from [0, 1000000).
    seed = np.random.randint(1000000)
    run_name = "FHP_NFSP_v001_SEED" + str(seed)

    # The totals below are divided by the number of learner-actor workers
    # so that each worker receives an equal (truncated) share.
    n_la = N_LA_FHP_NFSP
    share_of_256 = int(256 / n_la)

    profile = TrainingProfile(
        name=run_name,
        game_cls=Flop3Holdem,

        # Exploration / optimisation hyper-parameters.
        eps_const=0.005,
        eps_start=0.08,
        target_net_update_freq=1000,
        min_prob_add_res_buf=0.25,
        lr_avg=0.01,
        lr_br=0.1,

        # Per-worker buffer sizes, step counts and mini-batch sizes.
        n_learner_actor_workers=n_la,
        res_buf_size_each_la=int(2e7 / n_la),
        cir_buf_size_each_la=int(6e5 / n_la),
        n_steps_per_iter_per_la=share_of_256,
        mini_batch_size_br_per_la=share_of_256,
        mini_batch_size_avg_per_la=share_of_256,

        DISTRIBUTED=True,
        rlbr_args=DIST_RLBR_ARGS_games,
    )

    # NOTE(review): "rlbr": 200000 is presumably an evaluation interval and
    # n_iterations=None presumably means "no iteration limit" -- confirm
    # against the Driver implementation.
    ctrl = Driver(
        t_prof=profile,
        eval_methods={"rlbr": 200000},
        n_iterations=None,
    )
    ctrl.run()