MaskedLMTask.Config
Component: MaskedLMTask
- class MaskedLMTask.Config [source]
  Bases: NewTask.Config
All Attributes (including base classes)
- data: Data.Config = PackedLMData.Config()
- trainer: TaskTrainer.Config = TaskTrainer.Config()
- use_elastic: Optional[bool] = None
- model: MaskedLanguageModel.Config = MaskedLanguageModel.Config()
- metric_reporter: MaskedLMMetricReporter.Config = MaskedLMMetricReporter.Config()
Default JSON
{
"data": {
"PackedLMData": {
"source": {
"TSVDataSource": {
"column_mapping": {},
"train_filename": null,
"test_filename": null,
"eval_filename": null,
"field_names": null,
"delimiter": "\t",
"quoted": false,
"drop_incomplete_rows": false
}
},
"batcher": {
"PoolingBatcher": {
"train_batch_size": 16,
"eval_batch_size": 16,
"test_batch_size": 16,
"pool_num_batches": 1000,
"num_shuffled_pools": 1
}
},
"sort_key": null,
"in_memory": true,
"max_seq_len": 128
}
},
"trainer": {
"TaskTrainer": {
"epochs": 10,
"early_stop_after": 0,
"max_clip_norm": null,
"report_train_metrics": true,
"target_time_limit_seconds": null,
"do_eval": true,
"load_best_model_after_train": true,
"num_samples_to_log_progress": 1000,
"num_accumulated_batches": 1,
"num_batches_per_epoch": null,
"optimizer": {
"Adam": {
"lr": 0.001,
"weight_decay": 1e-05,
"eps": 1e-08
}
},
"scheduler": null,
"sparsifier": null,
"fp16_args": {
"FP16OptimizerFairseq": {
"init_loss_scale": 128,
"scale_window": null,
"scale_tolerance": 0.0,
"threshold_loss_scale": null,
"min_loss_scale": 0.0001
}
},
"privacy_engine": null,
"use_tensorboard": false
}
},
"use_elastic": null,
"model": {
"inputs": {
"tokens": {
"BERTTensorizerBase": {
"is_input": true,
"columns": [
"text"
],
"tokenizer": {
"Tokenizer": {
"split_regex": "\\s+",
"lowercase": true,
"use_byte_offsets": false
}
},
"base_tokenizer": null,
"vocab_file": "",
"max_seq_len": 128
}
}
},
"encoder": {
"TransformerSentenceEncoder": {
"load_path": null,
"save_path": null,
"freeze": false,
"shared_module_key": null,
"output_dropout": 0.4,
"embedding_dim": 768,
"pooling": "cls_token",
"export": false,
"projection_dim": 0,
"normalize_output_rep": false,
"dropout": 0.1,
"attention_dropout": 0.1,
"activation_dropout": 0.1,
"ffn_embedding_dim": 3072,
"num_encoder_layers": 6,
"num_attention_heads": 8,
"num_segments": 2,
"use_position_embeddings": true,
"offset_positions_by_padding": true,
"apply_bert_init": true,
"encoder_normalize_before": true,
"activation_fn": "relu",
"max_seq_len": 128,
"multilingual": false,
"freeze_embeddings": false,
"n_trans_layers_to_freeze": 0,
"use_torchscript": false,
"use_bias_finetuning": false
}
},
"decoder": {
"load_path": null,
"save_path": null,
"freeze": false,
"shared_module_key": null,
"hidden_dims": [],
"out_dim": null,
"layer_norm": false,
"dropout": 0.0,
"bias": true,
"activation": "relu",
"temperature": 1.0,
"spectral_normalization": false
},
"output_layer": {
"load_path": null,
"save_path": null,
"freeze": false,
"shared_module_key": null,
"loss": {}
},
"mask_prob": 0.15,
"mask_bos": false,
"masking_strategy": "random",
"tie_weights": true
},
"metric_reporter": {
"output_path": "/tmp/test_out.txt",
"pep_format": false,
"student_column_names": [],
"log_gradient": false,
"aggregate_metrics": true,
"perplexity_type": "median"
}
}