Files
fleet-commander/train.py

20 lines
380 B
Python

from stable_baselines3 import PPO
from utils.ml import SpaceInvadersEnv
# Training script: build the environment, fit a PPO agent on it, and persist
# the trained agent under the name "invader_agent".
env = SpaceInvadersEnv()

# PPO hyperparameters, grouped so they can be read and tuned in one place.
ppo_hyperparams = {
    # Rollout collection and optimisation schedule.
    "n_steps": 2048,        # steps gathered per environment before each update
    "batch_size": 64,       # minibatch size used during the gradient updates
    "n_epochs": 10,         # optimisation passes over each collected rollout
    "learning_rate": 3e-4,
    # Return / advantage estimation.
    "gamma": 0.99,          # discount factor
    "gae_lambda": 0.95,     # GAE bias/variance trade-off factor
    # Loss shaping.
    "ent_coef": 0.02,       # entropy coefficient in the loss
    "clip_range": 0.2,      # PPO clipping parameter
    # Runtime settings.
    "verbose": 1,
    "device": "cpu",
}

model = PPO("MlpPolicy", env, **ppo_hyperparams)

# Train for one million timesteps, then write the agent to disk.
model.learn(1_000_000)
model.save("invader_agent")