---
# NOTE(review): this file was reconstructed from a version in which every
# key sat on a single line, which is not parseable YAML. The nesting below
# (three top-level sections) is the most plausible reading -- confirm against
# the code that loads this config.

# Presumably environment settings; units of the price fields are not stated
# here -- TODO confirm.
env:
  scenario: 0
  target_price: 100
  threshold_price: 120

# Presumably dataset loading options; `path` looks relative, but the base
# directory it is resolved against is not visible here -- verify with the loader.
dataset_params:
  path: datasets/collected_data.h5
  batch_size: 64

# Presumably agent hyperparameters -- confirm which agent consumes them.
agent:
  learning_rate: 0.001
  discount_factor: 0.99