diff --git a/main.py b/main.py index e05867d..6ed86e3 100755 --- a/main.py +++ b/main.py @@ -1,5 +1,5 @@ import torch - +import numpy as np import helpers from environment import CarRacingEnv from trainer import Trainer @@ -22,6 +22,13 @@ 'train': True } + # Reproducibility: manual seeding + seed = 7081960 + torch.manual_seed(seed) + torch.cuda.manual_seed(seed) + np.random.seed(seed) + + env = CarRacingEnv(device, hyperparams['stack_frames'], hyperparams['train']) helpers.display_start() if hyperparams['train']: diff --git a/params/policy-params.dl b/params/policy-params.dl index d75bdb8..bbb4a34 100644 Binary files a/params/policy-params.dl and b/params/policy-params.dl differ diff --git a/runs/Apr14_12-13-13_ubuntu-jp/events.out.tfevents.1618395193.ubuntu-jp.3086.0 b/runs/Apr14_12-13-13_ubuntu-jp/events.out.tfevents.1618395193.ubuntu-jp.3086.0 new file mode 100644 index 0000000..d053f44 Binary files /dev/null and b/runs/Apr14_12-13-13_ubuntu-jp/events.out.tfevents.1618395193.ubuntu-jp.3086.0 differ