bobox's picture
n_layers_per_step = 1, last_layer_weight = 1.5 * model_layers, prior_layers_weight = 1, kl_div_weight = 2, kl_temperature = 1
554d487 verified
raw
history blame contribute delete
296 Bytes
{
"word_embedding_dimension": 768,
"pooling_mode_cls_token": false,
"pooling_mode_mean_tokens": true,
"pooling_mode_max_tokens": false,
"pooling_mode_mean_sqrt_len_tokens": false,
"pooling_mode_weightedmean_tokens": false,
"pooling_mode_lasttoken": false,
"include_prompt": true
}