---
# Flat mapping of run settings, one key per line.
# NOTE(review): what each key controls is not visible from this file;
# confirm the meanings and valid ranges against the code that loads it.

hidden_size: 32
expert: strong_branch
n_episodes: 50
n_samples: 100000
n_epochs: 100
# Written with an explicit mantissa dot: YAML 1.1 loaders (e.g. PyYAML)
# resolve a bare `1e-3` as a string, whereas `1.0e-3` is read as a float
# by both YAML 1.1 and YAML 1.2 parsers.
lr: 1.0e-3
seed: 0
expert_probability: 0.05
sample_prob: 0.3