mirror of
https://github.com/csd4ni3l/fleet-commander.git
synced 2026-01-01 04:23:47 +01:00
add better model, improve rewards
This commit is contained in:
3
.gitignore
vendored
3
.gitignore
vendored
@@ -180,4 +180,5 @@ test*.py
|
|||||||
logs/
|
logs/
|
||||||
logs
|
logs
|
||||||
settings.json
|
settings.json
|
||||||
training_logs
|
training_logs
|
||||||
|
*.bck*
|
||||||
BIN
invader_agent.zip
Normal file
BIN
invader_agent.zip
Normal file
Binary file not shown.
@@ -178,7 +178,7 @@ class SpaceInvadersEnv(gym.Env):
|
|||||||
nearest = self._nearest_enemy()
|
nearest = self._nearest_enemy()
|
||||||
alignment = abs(nearest.center_x - self.player.center_x) / self.width
|
alignment = abs(nearest.center_x - self.player.center_x) / self.width
|
||||||
if alignment < 0.025:
|
if alignment < 0.025:
|
||||||
reward += 0.1
|
reward += 0.005
|
||||||
|
|
||||||
self.player.center_x = np.clip(self.player.center_x, 0, self.width)
|
self.player.center_x = np.clip(self.player.center_x, 0, self.width)
|
||||||
self.player_speed = (self.player.center_x - prev_x) / max(1e-6, PLAYER_SPEED)
|
self.player_speed = (self.player.center_x - prev_x) / max(1e-6, PLAYER_SPEED)
|
||||||
@@ -260,11 +260,11 @@ class SpaceInvadersEnv(gym.Env):
|
|||||||
self.bullets.append(b)
|
self.bullets.append(b)
|
||||||
|
|
||||||
if self.player_alive:
|
if self.player_alive:
|
||||||
edge_threshold = self.width * 0.15
|
edge_threshold = self.width * 0.1
|
||||||
if self.player.center_x < edge_threshold or self.player.center_x > self.width - edge_threshold:
|
if self.player.center_x < edge_threshold or self.player.center_x > self.width - edge_threshold:
|
||||||
reward -= 0.03
|
reward -= 0.03
|
||||||
|
|
||||||
reward -= 0.0025
|
reward -= 0.01
|
||||||
|
|
||||||
obs = self._obs()
|
obs = self._obs()
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user