# Settings grouped under `dataset_params`.
dataset_params:
  # Path to the data file, written without a leading slash (so it is
  # relative). NOTE(review): the `.h5` extension suggests HDF5, and the
  # base directory depends on the consumer -- confirm against the loader.
  path: datasets/collected_data.h5
  # Integer batch size. Presumably samples per batch -- verify in the
  # code that reads this key.
  batch_size: 64

# Settings grouped under `agent_params`.
agent_params:
  # Float values; parsers load these as numbers, not strings.
  learning_rate: 0.001
  discount_factor: 0.99