// AllenNLP experiment configuration for a "biaffine_parser" model that reads
// data with the "universal_dependencies" dataset reader.
//
// Two external variables must be supplied when this file is evaluated:
//   PTB_DEPENDENCIES_TRAIN - training data path
//   PTB_DEPENDENCIES_VAL   - validation data path

// Embedding sizes, named once so the encoder input size below stays in sync.
local word_embedding_dim = 100;
local pos_embedding_dim = 100;

// Initializer specs that are reused by several regexes in the model initializer.
local xavier_uniform = { "type": "xavier_uniform" };
local zero = { "type": "zero" };

{
  "dataset_reader": {
    "type": "universal_dependencies"
  },

  "train_data_path": std.extVar("PTB_DEPENDENCIES_TRAIN"),
  "validation_data_path": std.extVar("PTB_DEPENDENCIES_VAL"),

  "model": {
    "type": "biaffine_parser",

    "text_field_embedder": {
      "token_embedders": {
        "tokens": {
          "type": "embedding",
          "embedding_dim": word_embedding_dim,
          "pretrained_file": "https://allennlp.s3.amazonaws.com/datasets/glove/glove.6B.100d.txt.gz",
          "trainable": true,
          // Sparse embeddings; the trainer below uses "dense_sparse_adam".
          "sparse": true
        }
      }
    },

    "pos_tag_embedding": {
      "embedding_dim": pos_embedding_dim,
      "vocab_namespace": "pos",
      "sparse": true
    },

    "encoder": {
      "type": "stacked_bidirectional_lstm",
      // Evaluates to 200. Presumably the encoder consumes the word and POS
      // embeddings concatenated - TODO confirm against the model code.
      "input_size": word_embedding_dim + pos_embedding_dim,
      "hidden_size": 400,
      "num_layers": 3,
      "recurrent_dropout_probability": 0.3,
      "use_highway": true
    },

    "use_mst_decoding_for_validation": true,
    "arc_representation_dim": 500,
    "tag_representation_dim": 100,
    "dropout": 0.3,
    "input_dropout": 0.3,

    // Each entry pairs a parameter-name regex with the initializer to apply.
    "initializer": {
      "regexes": [
        [".*projection.*weight", xavier_uniform],
        [".*projection.*bias", zero],
        [".*tag_bilinear.*weight", xavier_uniform],
        [".*tag_bilinear.*bias", zero],
        [".*weight_ih.*", xavier_uniform],
        [".*weight_hh.*", { "type": "orthogonal" }],
        [".*bias_ih.*", zero],
        [".*bias_hh.*", { "type": "lstm_hidden_bias" }]
      ]
    }
  },

  "data_loader": {
    "batch_sampler": {
      "type": "bucket",
      "batch_size": 128
    }
  },

  "trainer": {
    "num_epochs": 50,
    "grad_norm": 5.0,
    // NOTE(review): patience equals num_epochs, so patience-based early
    // stopping presumably never triggers before the last epoch - confirm intent.
    "patience": 50,
    // NOTE(review): the leading "+" presumably marks LAS as a metric to
    // maximize - verify against the trainer documentation.
    "validation_metric": "+LAS",
    "optimizer": {
      "type": "dense_sparse_adam",
      "betas": [0.9, 0.9]
    }
  }
}