MIST / config.json
grgera's picture
Push model using huggingface_hub.
97ff799 verified
raw
history blame contribute delete
402 Bytes
{
"license": "mit",
"max_input_dim": 64,
"n_dec_layers": 1,
"n_inds": 32,
"n_phi_heads": 16,
"n_phi_layers": 2,
"n_rho_layers": 3,
"n_seeds": 10,
"output_dim": 1,
"phi_activation_fun": "gelu",
"phi_dim_forward": 1024,
"phi_hidden_dim": 256,
"phi_model": "set_transformer",
"quantile_conditioned": false,
"repo_url": null,
"rho_hidden_dim": 256,
"sab_stack_layers": 2
}