| { | |
| "dataset_reader": { | |
| "type": "text_classification_json", | |
| "token_indexers": { | |
| "tokens": { | |
| "type": "single_id", | |
| "namespace": "tokens", | |
| "lowercase_tokens": true, | |
| "token_min_padding_length": 5 | |
| } | |
| }, | |
| "tokenizer": { | |
| "type": "pretrained_transformer", | |
| "model_name": "google-bert/bert-base-multilingual-uncased" | |
| }, | |
| "max_sequence_length": 256 | |
| }, | |
| "train_data_path": "train.json", | |
| "validation_data_path": "valid.json", | |
| "vocabulary": { | |
| "directory_path": "vocabulary" | |
| }, | |
| "model": { | |
| "type": "basic_classifier", | |
| "text_field_embedder": { | |
| "token_embedders": { | |
| "tokens": { | |
| "type": "embedding", | |
| "num_embeddings": 105880, | |
| "embedding_dim": 64 | |
| } | |
| } | |
| }, | |
| "seq2seq_encoder": { | |
| "type": "pass_through", | |
| "input_dim": 64 | |
| }, | |
| "seq2vec_encoder": { | |
| "type": "bag_of_embeddings", | |
| "embedding_dim": 64 | |
| } | |
| }, | |
| "data_loader": { | |
| "type": "multiprocess", | |
| "batch_size": 64, | |
| "shuffle": true | |
| }, | |
| "trainer": { | |
| "type": "gradient_descent", | |
| "cuda_device": -1, | |
| "optimizer": { | |
| "type": "bert_adam", | |
| "lr": 5e-05, | |
| "warmup": 0.1, | |
| "t_total": 50000, | |
| "schedule": "warmup_linear" | |
| }, | |
| "checkpointer": { | |
| "serialization_dir": "serialization_dir", | |
| "keep_most_recent_by_count": 10 | |
| }, | |
| "patience": 5, | |
| "validation_metric": "+accuracy", | |
| "num_epochs": 100 | |
| } | |
| } |