{ "vocab_size": 50258, "emb_size": 256, "nhead": 8, "num_encoder_layers": 4, "num_decoder_layers": 4, "dim_feedforward": 1024, "dropout": 0.1, "max_text_len": 128, "max_coord_len": 11, "max_waypoints": 10, "num_count_classes": 11, "architecture": "Seq2SeqCoordsTransformer" }