After training for a while, I get this message in Python and Unity stops. Code (CSharp): Traceback (most recent call last): File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer_controller.py", line 175, in start_learning n_steps = self.advance(env_manager) File "d:\python\python37\lib\site-packages\mlagents_envs\timers.py", line 305, in wrapped return func(*args, **kwargs) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer_controller.py", line 250, in advance trainer.advance() File "d:\python\python37\lib\site-packages\mlagents\trainers\ghost\trainer.py", line 243, in advance self.trainer.advance() File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", line 274, in advance self._process_trajectory(t) File "d:\python\python37\lib\site-packages\mlagents\trainers\ppo\trainer.py", line 67, in _process_trajectory super()._process_trajectory(trajectory) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", line 232, in _process_trajectory self._maybe_save_model(self.get_step + len(trajectory.steps)) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", line 257, in _maybe_save_model self._checkpoint() File "d:\python\python37\lib\site-packages\mlagents_envs\timers.py", line 305, in wrapped return func(*args, **kwargs) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", line 155, in _checkpoint checkpoint_path = self.model_saver.save_checkpoint(self.brain_name, self.step) File "d:\python\python37\lib\site-packages\mlagents\trainers\model_saver\torch_model_saver.py", line 56, in save_checkpoint torch.save(state_dict, os.path.join(self.model_path, "checkpoint.pt")) File "d:\python\python37\lib\site-packages\torch\serialization.py", line 369, in save with _open_file_like(f, 'wb') as opened_file: File "d:\python\python37\lib\site-packages\torch\serialization.py", line 230, in _open_file_like return 
_open_file(name_or_buffer, mode) File "d:\python\python37\lib\site-packages\torch\serialization.py", line 211, in __init__ super(_open_file, self).__init__(open(name, mode)) OSError: [Errno 22] Invalid argument: 'results\\one\\Balance\\checkpoint.pt' During handling of the above exception, another exception occurred: Traceback (most recent call last): File "d:\python\python37\lib\runpy.py", line 193, in _run_module_as_main "__main__", mod_spec) File "d:\python\python37\lib\runpy.py", line 85, in _run_code exec(code, run_globals) File "D:\Python\Python37\Scripts\mlagents-learn.exe\__main__.py", line 7, in <module> File "d:\python\python37\lib\site-packages\mlagents\trainers\learn.py", line 250, in main run_cli(parse_command_line()) File "d:\python\python37\lib\site-packages\mlagents\trainers\learn.py", line 246, in run_cli run_training(run_seed, options) File "d:\python\python37\lib\site-packages\mlagents\trainers\learn.py", line 125, in run_training tc.start_learning(env_manager) File "d:\python\python37\lib\site-packages\mlagents_envs\timers.py", line 305, in wrapped return func(*args, **kwargs) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer_controller.py", line 200, in start_learning self._save_models() File "d:\python\python37\lib\site-packages\mlagents_envs\timers.py", line 305, in wrapped return func(*args, **kwargs) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer_controller.py", line 80, in _save_models self.trainers[brain_name].save_model() File "d:\python\python37\lib\site-packages\mlagents\trainers\ghost\trainer.py", line 320, in save_model self.trainer.save_model() File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", line 181, in save_model model_checkpoint = self._checkpoint() File "d:\python\python37\lib\site-packages\mlagents_envs\timers.py", line 305, in wrapped return func(*args, **kwargs) File "d:\python\python37\lib\site-packages\mlagents\trainers\trainer\rl_trainer.py", 
line 155, in _checkpoint checkpoint_path = self.model_saver.save_checkpoint(self.brain_name, self.step) File "d:\python\python37\lib\site-packages\mlagents\trainers\model_saver\torch_model_saver.py", line 56, in save_checkpoint torch.save(state_dict, os.path.join(self.model_path, "checkpoint.pt")) File "d:\python\python37\lib\site-packages\torch\serialization.py", line 369, in save with _open_file_like(f, 'wb') as opened_file: File "d:\python\python37\lib\site-packages\torch\serialization.py", line 230, in _open_file_like return _open_file(name_or_buffer, mode) File "d:\python\python37\lib\site-packages\torch\serialization.py", line 211, in __init__ super(_open_file, self).__init__(open(name, mode)) OSError: [Errno 22] Invalid argument: 'results\\one\\Balance\\checkpoint.pt'
I adjusted the rewards so that I don't get large negative values, and the crash has not reproduced since. I'm not sure whether that is related or whether the crash was just a random occurrence.
Hi, please post more information, such as:
- your training configuration
- the Unity logs
- the action/observation space
- the actuators/sensors you are using
- the command you used to invoke mlagents-learn

Thank you!