Add model training with graphs and current stats; improve the model with a better reward system

2026-01-01 04:23:47 +01:00 · 2025-11-15 18:54:37 +01:00
parent 32477def6a
commit 05f568a457
10 changed files with 204 additions and 92 deletions
--- a/train.py
+++ b/train.py
@@ -1,20 +0,0 @@
-from stable_baselines3 import PPO
-from utils.ml import SpaceInvadersEnv
-
-env = SpaceInvadersEnv()
-model = PPO(
-    "MlpPolicy", 
-    env, 
-    n_steps=2048,
-    batch_size=64,
-    n_epochs=10,
-    learning_rate=3e-4,
-    verbose=1, 
-    device="cpu", 
-    gamma=0.99, 
-    ent_coef=0.02,
-    clip_range=0.2,
-    gae_lambda=0.95
-)
-model.learn(1_000_000)
-model.save("invader_agent")