Example #1
0
# Register the --learning-rate and --gpu-num flags on the parser created
# earlier in the script, then parse the command line.
parser.add_argument(
    '--learning-rate',
    default=0.0001,
    type=float,
)
parser.add_argument(
    '--gpu-num',
    default=0,
    type=int,
)
args = parser.parse_args()

# Describe the per-run tree <run_dir>/<name>/{autoencoder,correlation,policies}
# and pass it to build_directory_structure with '.' as the base argument.
# Every sub-directory entry maps to its own fresh empty dict.
build_directory_structure(
    '.',
    {
        args.run_dir: {
            args.name: {
                subdir: {}
                for subdir in ('autoencoder', 'correlation', 'policies')
            },
        },
    },
)

# Point the logger at ./<run_dir>/<name>.
LOG.setup(
    os.path.join('.', args.run_dir, args.name),
)

# Two independent gridworld instances, constructed in this order.
env, dummy_env = SimpleGridworld(), SimpleGridworld()

# Feature learner configured from the parsed command-line options.
net = IndepFeatureLearner(
    lmbda=args.lmbda,
    learning_rate=args.learning_rate,
    gpu_num=args.gpu_num,
)

# Replay buffer constructed with 10000 as its only argument
# (presumably the capacity; confirm against ReplayBuffer).
buffer = replay_buffer.ReplayBuffer(10000)

# Module-level settings read by the code that follows.
visualization_freq = 10000
batch_size = args.batch_size


def run_training_step(buffer: replay_buffer.ReplayBuffer,
                      net: IndepFeatureLearner):
    positions, _, _, _, _ = buffer.sample(batch_size)