# Manifest for the `rl_trainer` component: reinforcement learning agent
# training (PPO on a GPU node).
#
# NOTE(review): this file was recovered from a single collapsed line, so the
# nesting below is reconstructed from key order. Confirm that `location` and
# `preferred_hosts` belong under `compute` and that `requires_llm` is a
# top-level key before relying on this layout.

name: rl_trainer
# Quoted so the version is always read as a string, never as a number.
version: "0.1.0"
description: Reinforcement learning agent training (PPO on GPU node)

# Compute requirements / placement for this component.
compute:
  gpu: true
  gpu_memory_gb: 8
  location: remote
  # Explicit empty list (a bare `preferred_hosts:` would parse as null).
  preferred_hosts: []

requires_llm: false

# Environment variables; values are quoted so they remain strings
# (e.g. TRAINING_STEPS stays "100000" rather than becoming an integer).
env:
  RL_MODEL: "ppo_trader"
  TRAINING_STEPS: "100000"