Advertisement
Guest User

Untitled

a guest
Nov 15th, 2019
137
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
JSON 3.31 KB | None | 0 0
  1. {
  2.   "dataset_reader": {
  3.     "type": "squad",
  4.     "lazy": true,
  5.     "passage_length_limit": 400,
  6.     "tokenizer": {
  7.       "type": "word",
  8.       "word_splitter": {
  9.         "type": "spacy",
  10.         "pos_tags": true,
  11.         "ner": true
  12.       }
  13.     },
  14.     "token_indexers": {
  15.       "token_characters": {
  16.         "type": "characters",
  17.         "min_padding_length": 3
  18.       },
  19.       "bert": {
  20.           "type": "bert-pretrained",
  21.           "pretrained_model": "bert-base-uncased",
  22.           "do_lowercase": true,
  23.           "use_starting_offsets": true
  24.       },
  25.       "pos_tag": {
  26.         "type": "pos_tag"
  27.       },
  28.       "ner_tag": {
  29.         "type": "ner_tag"
  30.       }
  31.     }
  32.   },
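  33.   "train_data_path": "dev-v2.0.json",  // NOTE(review): same file as validation_data_path, so validation F1 and early stopping are measured on the training data — confirm this is intentional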
  34.   "validation_data_path": "dev-v2.0.json",
  35.   "model": {
  36.     "type": "slqa",
  37.     "word_embedder": {
  38.       "embedder_to_indexer_map": {
  39.         "bert": ["bert", "bert-offsets"],
  40.         "token_characters": ["token_characters"]
  41.       },
  42.       "token_embedders": {
  43.           "bert": {
  44.             "type": "bert-pretrained",
  45.             "pretrained_model": "bert-base-uncased"
  46.           },
  47.           "token_characters": {
  48.             "type": "character_encoding",
  49.             "embedding": {
  50.               "embedding_dim": 16
  51.             },
  52.             "encoder": {
  53.               "type": "cnn",
  54.               "embedding_dim": 16,
  55.               "num_filters": 128,
  56.               "ngram_filter_sizes": [3],
  57.               "conv_layer_activation": "relu"
  58.             }
  59.           }
  60.       },
  61.       "allow_unmatched_keys": true
  62.     },
  63.     "phrase_layer": {
  64.       "type": "lstm",
  65.       "bidirectional": true,
  66.       "input_size": 896,
  67.       "hidden_size": 100,
  68.       "num_layers": 1,
  69.       "dropout": 0.4
  70.     },
  71.     "features_embedder": {
  72.       "embedder_to_indexer_map": {
  73.         "pos_tag": ["pos_tag"],
  74.         "ner_tag": ["ner_tag"]
  75.       },
  76.       "pos_tag": {
  77.         "type": "embedding",
  78.         "embedding_dim": 16,
  79.         "trainable": false
  80.       },
  81.       "ner_tag": {
  82.         "type": "embedding",
  83.         "embedding_dim": 16,
  84.         "trainable": false
  85.       },
  86.       "allow_unmatched_keys": true
  87.     },
  88.     "projected_layer": {
  89.       "type": "lstm",
  90.       "bidirectional": true,
  91.       "input_size": 200,
  92.       "hidden_size": 100,
  93.       "num_layers": 1,
  94.       "dropout": 0.4
  95.     },
  96.     "contextual_passage": {
  97.       "type": "lstm",
  98.       "bidirectional": true,
  99.       "input_size": 200,
  100.       "hidden_size": 100,
  101.       "num_layers": 1,
  102.       "dropout": 0.4
  103.     },
  104.     "contextual_question": {
  105.       "type": "lstm",
  106.       "bidirectional": true,
  107.       "input_size": 200,
  108.       "hidden_size": 100,
  109.       "num_layers": 1,
  110.       "dropout": 0.4
  111.     },
  112.     "dropout": 0.4
  113.   },
  114.   "iterator": {
  115.     "type": "bucket",
  116.     "sorting_keys": [["passage", "num_tokens"], ["question", "num_tokens"]],
  117.     "batch_size": 32,
  118.     "max_instances_in_memory": 32
  119.   },
  120.   "trainer": {
  121.     "num_epochs": 50,
  122.     "grad_norm": 5.0,
  123.     "patience": 10,
  124.     "validation_metric": "+f1",
  125.     "cuda_device": 0,
  126.     "learning_rate_scheduler":  {
  127.       "type": "reduce_on_plateau",
  128.       "factor": 0.5,
  129.       "mode": "max",
  130.       "patience": 2
  131.  
  132.     },
  133.     "optimizer": {
  134.       "type": "adamax",
  135.       // "betas": [0.9, 0.9],
  136.       "lr": 0.002
  137.     }
  138.   }
  139. }
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement