td3: {
    # Learning rates for the actor and the critic. The mantissa is written with
    # an explicit decimal point because YAML 1.1 resolvers (e.g. PyYAML) only
    # treat exponent notation as a float when a "." is present; a bare 3e-4
    # would be loaded as a string instead of a number.
    actor_learning_rate: 3.0e-4,
    critic_learning_rate: 3.0e-4,
    # NOTE(review): presumably the number of samples per training update;
    # confirm against the code that consumes this config.
    batch_size: 256,
    # NOTE(review): presumably the target-network soft-update coefficient;
    # confirm against the code that consumes this config.
    tau: 0.005,