File size: 361 Bytes
fccc682
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{
    "num_features": 32768,
    "num_layers": 12,
    "d_model": 768,
    "activation_fn": "topk",
    "topk_k": 16,
    "topk_straight_through": true,
    "topk_mode": "per_layer",
    "decoder_tying": "per_target",
    "enable_feature_offset": false,
    "enable_feature_scale": false,
    "skip_connection": false,
    "normalization_method": "mean_std"
  }