New Page
{
"dataset_reader": {
"type": "transformer_squad",
"length_limit": 512,
"transformer_model_name": "roberta-large"
},
"model": {
"type": "transformer_qa",
"transformer_model_name": "roberta-large"
},
"train_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-train-v2.0.json",
"validation_data_path": "https://allennlp.s3.amazonaws.com/datasets/squad/squad-dev-v2.0.json",
"trainer": {
"callbacks": [
"tensorboard"
],
"grad_clipping": 1,
"learning_rate_scheduler": {
"type": "slanted_triangular",
"cut_frac": 0.1,
"num_epochs": 5
},
"num_epochs": 5,
"num_gradient_accumulation_steps": 2,
"optimizer": {
"type": "huggingface_adamw",
"eps": 1e-08,
"lr": 2e-05,
"parameter_groups": [
[
[
"bias",
"LayerNorm\\.weight",
"layer_norm\\.weight"
],
{
"weight_decay": 0
}
]
],
"weight_decay": 0
},
"validation_metric": "+per_instance_f1"
},
"vocabulary": {
"type": "empty"
},
"data_loader": {
"batch_sampler": {
"type": "bucket",
"batch_size": 8
}
},
"numpy_seed": 100,
"pytorch_seed": 100,
"random_seed": 100
}
No Comments