-
Notifications
You must be signed in to change notification settings - Fork 6
/
Copy pathHumanControl.py
58 lines (49 loc) · 1.31 KB
/
HumanControl.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
from pyglet.window import key
import numpy as np
from .Agar_env.Env import AgarEnv
import time
# When true, the main loop draws the environment on every iteration and hooks
# the keyboard/mouse handlers onto the render window.
render = True
# Number of rows in the shared action array; also handed to the environment
# configuration as `num_controlled_agent`.
num_agents = 2
class Args:
    """Hard-coded configuration object passed to ``AgarEnv``.

    Every attribute is a fixed value except ``num_controlled_agent``, which
    mirrors the module-level ``num_agents``.  How the environment interprets
    each field is not visible in this file.
    """

    def __init__(self):
        # Agent count is shared with the action array built by this script.
        self.num_controlled_agent = num_agents

        # Run settings.
        self.eval = True
        self.action_repeat = 1
        self.num_processes = 64

        # Training-style hyperparameters (presumably unused for human play;
        # confirm against AgarEnv).
        self.gamma = 0.99
        self.total_step = 1e8
# Build the environment from the hard-coded Args configuration and seed it
# with 0.
env = AgarEnv(Args())
env.seed(0)
# Iteration counter for the main loop; starts at 1 and drives the periodic
# progress printout.
step = 1
# Handle to the render window; stays None until it is fetched from
# env.viewer after the first render call.
window = None
# Shared action buffer: one row of 3 values per agent.  The input handlers
# only ever write row 0 (columns 0/1 from the mouse, column 2 from SPACE).
action = np.zeros((num_agents, 3))
def on_mouse_motion(x, y, dx, dy):
    """Map the mouse position to agent 0's two movement components.

    The cursor position is normalised against the window size so that the
    window's lower/left edge maps to -1, its centre to 0 and its upper/right
    edge to +1.  The results are written into ``action[0][0]`` (horizontal)
    and ``action[0][1]`` (vertical).

    Args:
        x: Cursor x position in window coordinates.
        y: Cursor y position in window coordinates.
        dx: Relative x movement since the last event (unused).
        dy: Relative y movement since the last event (unused).
    """
    # Prefer the live window size so the mapping stays correct when the
    # window is not 1920x1080; fall back to the original constants when the
    # window is not available yet or reports a zero dimension.
    width = getattr(window, 'width', None) or 1920
    height = getattr(window, 'height', None) or 1080
    action[0][0] = (x / width - 0.5) * 2
    action[0][1] = (y / height - 0.5) * 2
def on_key_press(k, modifiers):
    """Set agent 0's third action component from the pressed key.

    SPACE writes 1 into ``action[0][2]``; any other key writes 0.

    Args:
        k: Key symbol of the pressed key.
        modifiers: Active modifier bitmask (unused).
    """
    action[0][2] = 1 if k == key.SPACE else 0
# Human-control loop: step the environment a fixed number of times, feeding
# it the action buffer that the mouse/keyboard handlers fill in.
start = time.time()
# Remaining iterations; the loop stops when this reaches zero.
ca = 100
try:
    for episode in range(1):
        observation = env.reset()
        while ca > 0:
            ca -= 1
            # Throttle the loop to roughly 20 iterations per second.
            time.sleep(0.05)
            if step % 40 == 0:
                # Periodic progress report: step count and average steps/sec.
                print('step', step)
                print(step / (time.time() - start))
            if render:
                env.render(0)
                if window is None:
                    # The viewer window only exists after the first render
                    # call, so the input handlers are attached lazily, once.
                    window = env.viewer.window
                    window.on_key_press = on_key_press
                    window.on_mouse_motion = on_mouse_motion
            # The environment is stepped with the flattened action buffer.
            a = action.reshape(-1)
            # NOTE(review): `done` is ignored, so the loop keeps stepping
            # after an episode ends -- confirm this is intended.
            observations, rewards, done, info = env.step(a)
            # The SPACE action is one-shot: clear it after every step.
            action[0][2] = 0
            step += 1
finally:
    # Always release the environment (and its window), even if the loop is
    # interrupted or a step raises.
    env.close()