sac: {
    # Exponent-form floats are written with an explicit decimal point:
    # YAML 1.1 loaders (e.g. PyYAML) resolve a dot-less `3e-4` as a string,
    # while `3.0e-4` is a float under both YAML 1.1 and YAML 1.2.
    actor_learning_rate: 3.0e-4,
    critic_learning_rate: 3.0e-4,
    temp_learning_rate: 3.0e-4,
    batch_size: 256,