# Environment settings. The keys are nested under `env` so that the section is
# a mapping (a bare `env:` with unindented keys below it parses as null and
# leaves those keys at the top level of the document).
# NOTE(review): the meaning of the `scenario` index and the unit of the two
# price values are not defined in this file — confirm against the consumer.
env:
  scenario: 0
  target_price: 100
  threshold_price: 120
# Dataset settings. The keys are nested under `dataset_params` so that the
# section is a mapping rather than a null value followed by top-level keys.
# NOTE(review): `path` is a relative path; presumably it is resolved against
# the process working directory — confirm against the loader.
dataset_params:
  path: datasets/collected_data.h5
  batch_size: 64
# Agent settings. The keys are nested under `agent` so that the section is a
# mapping rather than a null value followed by top-level keys.
# NOTE(review): both values are plain floats; how the agent consumes them
# (optimizer step size, return discounting) is assumed from the key names —
# confirm against the training code.
agent:
  learning_rate: 0.001
  discount_factor: 0.99