---
# Experiment configuration.
#
# NOTE(review): this file was previously a single physical line, which is not
# parseable YAML (nested block mappings cannot share a line). The nesting of
# `experiment` -> `training` -> `hidden_size` is forced by the syntax; the
# depth of every key after `hidden_size` is an assumption (no dedent was
# recoverable) -- confirm against the code that loads this file and move keys
# up a level if the loader expects them directly under `experiment`.
experiment:
  training:
    hidden_size: 64
    expert: strong_branch
    # `problem` holds a scalar, so the three keys below are its siblings,
    # not its children.
    problem: setcover
    n_rows: 500
    n_cols: 500
    density: 0.05