forked from Kaiyotech/Opti
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathworker_recovery.py
136 lines (129 loc) · 5.18 KB
/
worker_recovery.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
import sys
from redis import Redis
from redis.retry import Retry
from redis.backoff import ExponentialBackoff
from redis.exceptions import ConnectionError, TimeoutError
from rlgym.envs import Match
from CoyoteObs import CoyoteObsBuilder
from rlgym.utils.terminal_conditions.common_conditions import GoalScoredCondition, TimeoutCondition, \
BallTouchedCondition
from mybots_terminals import BallTouchGroundCondition, PlayerTwoTouch, AttackerTouchCloseGoal, ReachObject
from rocket_learn.rollout_generator.redis.redis_rollout_worker import RedisRolloutWorker
from CoyoteParser import CoyoteAction
from rewards import ZeroSumReward
from torch import set_num_threads
from setter import CoyoteSetter
import Constants_recovery
import os
# Limit torch to a single thread in this worker process.
set_num_threads(1)

# Script entry point: builds the reward, the Match and the Redis connection,
# then starts a RedisRolloutWorker.
#
# Optional positional arguments:
#   argv[1]  Redis host (default "127.0.0.1"). Any value other than
#            "127.0.0.1" / "localhost" selects the remote connection settings.
#   argv[2]  worker name (default "Default").
#   argv[3]  'GAMESTATE' to send gamestates, or 'STREAMER' for streamer mode.
#
# The Redis password is read from the "redis_user1_key" environment variable.
if __name__ == "__main__":
    frame_skip = Constants_recovery.FRAME_SKIP

    # Reward weights, grouped so they can be tuned in one place.
    reward_weights = dict(
        velocity_pb_w=0,
        boost_gain_w=0.35,
        boost_spend_w=4,
        punish_boost=True,
        touch_ball_w=2.5,
        boost_remain_touch_w=2,
        touch_grass_w=0,
        supersonic_bonus_vpb_w=0,
        zero_touch_grass_if_ss=False,
        turtle_w=0,
        final_reward_ball_dist_w=1,
        final_reward_boost_w=0.3,
        forward_ctrl_w=0,
        curve_wave_zap_dash_w=0.15,
        walldash_w=0.35,
        jump_high_speed_w=-0.1,
        slow_w=-0.05,
    )
    rew = ZeroSumReward(
        zero_sum=Constants_recovery.ZERO_SUM,
        tick_skip=frame_skip,
        **reward_weights,
    )

    # NOTE(review): 120 is presumably the game's physics tick rate, making
    # fps the number of environment steps per second -- confirm.
    fps = 120 // frame_skip

    # Worker defaults; some are overridden below by the command line.
    send_gamestate = False
    streamer_mode = False
    auto_minimize = True
    game_speed = 100
    evaluation_prob = 0
    past_version_prob = 0.1
    deterministic_streamer = True
    force_old_deterministic = False
    gamemode_weights = {'1v1': 1, '2v2': 0, '3v3': 0}
    team_size = 3
    dynamic_game = True

    # Positional command-line arguments (all optional).
    cli_args = sys.argv[1:]
    host = cli_args[0] if len(cli_args) > 0 else "127.0.0.1"
    local = host in ("127.0.0.1", "localhost")
    name = cli_args[1] if len(cli_args) > 1 else "Default"
    # if len(sys.argv) > 3 and not dynamic_game:
    #     team_size = int(sys.argv[3])
    run_mode = cli_args[2] if len(cli_args) > 2 else None
    if run_mode == 'GAMESTATE':
        send_gamestate = True
    elif run_mode == 'STREAMER':
        # Streamer mode: real-time game speed, window not auto-minimized.
        streamer_mode = True
        evaluation_prob = 0
        game_speed = 1
        auto_minimize = False
        gamemode_weights = {'1v1': 1, '2v2': 0, '3v3': 0}

    # Match components, created in the same order as the Match arguments.
    state_setter = CoyoteSetter(mode="recovery")
    obs_builder = CoyoteObsBuilder(
        expanding=True,
        tick_skip=frame_skip,
        team_size=3,
        extra_boost_info=False,
        embed_players=False,
        add_jumptime=True,
        add_airtime=True,
        add_fliptime=True,
        add_boosttime=True,
        add_handbrake=True,
    )
    action_parser = CoyoteAction()
    terminal_conditions = [
        GoalScoredCondition(),
        # NOTE(review): presumably a 100-second episode cap -- confirm.
        TimeoutCondition(fps * 100),
        # TimeoutCondition(fps * 2),
        BallTouchedCondition(),
    ]
    match = Match(
        game_speed=game_speed,
        spawn_opponents=True,
        team_size=team_size,
        state_setter=state_setter,
        obs_builder=obs_builder,
        action_parser=action_parser,
        terminal_conditions=terminal_conditions,
        reward_function=rew,
        tick_skip=frame_skip,
    )

    # Connection settings shared by the local and the remote Redis.
    redis_kwargs = dict(
        host=host,
        username="user1",
        password=os.environ["redis_user1_key"],
        db=Constants_recovery.DB_NUM,
    )
    if not local:
        # Remote Redis: retry with exponential backoff on connection and
        # timeout errors. ConnectionError / TimeoutError here are the
        # redis.exceptions classes imported at the top of the file.
        redis_kwargs.update(
            retry_on_error=[ConnectionError, TimeoutError],
            retry=Retry(ExponentialBackoff(cap=10, base=1), 25),
        )
    r = Redis(**redis_kwargs)

    worker = RedisRolloutWorker(
        r, name, match,
        past_version_prob=past_version_prob,
        sigma_target=2,
        evaluation_prob=evaluation_prob,
        force_paging=False,
        dynamic_gm=dynamic_game,
        send_obs=True,
        auto_minimize=auto_minimize,
        send_gamestates=send_gamestate,
        gamemode_weights=gamemode_weights,  # default 1/3
        streamer_mode=streamer_mode,
        deterministic_streamer=deterministic_streamer,
        force_old_deterministic=force_old_deterministic,
        # testing
        batch_mode=True,
        step_size=Constants_recovery.STEP_SIZE,
    )
    worker.run()