@@ -13,33 +13,33 @@ class InteractivePolicy(Policy):
1313 def __init__ (self , env , agent_index ):
1414 super (InteractivePolicy , self ).__init__ ()
1515 self .env = env
16- # hard-coded keyborad events
16+ # hard-coded keyboard events
1717 self .move = [False for i in range (4 )]
1818 self .comm = [False for i in range (env .world .dim_c )]
19- # register keyboard events with this envornment 's window
19+ # register keyboard events with this environment 's window
2020 env .viewers [agent_index ].window .on_key_press = self .key_press
2121 env .viewers [agent_index ].window .on_key_release = self .key_release
2222
2323 def action (self , obs ):
2424 # ignore observation and just act based on keyboard events
25- if self .env .discrete_action_space :
25+ if self .env .discrete_action_input :
2626 u = 0
2727 if self .move [0 ]: u = 1
2828 if self .move [1 ]: u = 2
2929 if self .move [2 ]: u = 4
3030 if self .move [3 ]: u = 3
3131 else :
32- u = np .array ([0.0 ,0.0 ])
33- if self .move [0 ]: u [0 ] - = 1.0
34- if self .move [1 ]: u [0 ] += 1.0
35- if self .move [2 ]: u [1 ] += 1.0
36- if self .move [3 ]: u [1 ] - = 1.0
32+ u = np .array ([0.0 ,0.0 , 0.0 , 0.0 ])
33+ if self .move [0 ]: u [0 ] + = 1.0
34+ if self .move [1 ]: u [1 ] += 1.0
35+ if self .move [2 ]: u [2 ] += 1.0
36+ if self .move [3 ]: u [3 ] + = 1.0
3737 c = 0
3838 for i in range (len (self .comm )):
3939 if self .comm [i ]: c = i + 1
4040 return [u , c ]
4141
42- # keyborad event callbacks
42+ # keyboard event callbacks
4343 def key_press (self , k , mod ):
4444 if k == key .LEFT : self .move [0 ] = True
4545 if k == key .RIGHT : self .move [1 ] = True
@@ -53,4 +53,4 @@ def key_release(self, k, mod):
5353 if k == key .UP : self .move [2 ] = False
5454 if k == key .DOWN : self .move [3 ] = False
5555 for i in range (len (self .comm )):
56- if k == key ._1 + i : self .comm [i ] = False
56+ if k == key ._1 + i : self .comm [i ] = False
0 commit comments