| { |
| "init_opt": null, |
| "show_advanced_args": false, |
| "task": "interactive", |
| "datatype": "test", |
| "image_mode": "raw", |
| "numthreads": 1, |
| "hide_labels": false, |
| "batchsize": 128, |
| "dynamic_batching": null, |
| "datapath": "ParlAI/data", |
| "model": "transformer/generator", |
| "model_file": "ParlAI/data/models/blender/blender_3B/model", |
| "init_model": "/checkpoint/parlai/zoo/meena/20200319_meenav0data_tall_2.7B_adamoptimizer/20200319_13.3ppl_200kupdates/model", |
| "dict_class": "parlai.core.dict:DictionaryAgent", |
| "evaltask": null, |
| "eval_batchsize": null, |
| "display_examples": false, |
| "num_epochs": -1, |
| "max_train_time": 27647.999999999996, |
| "validation_every_n_secs": -1, |
| "save_every_n_secs": -1, |
| "save_after_valid": true, |
| "validation_every_n_epochs": 0.25, |
| "validation_max_exs": -1, |
| "short_final_eval": false, |
| "validation_patience": 10, |
| "validation_metric": "ppl", |
| "validation_metric_mode": "min", |
| "validation_cutoff": 1.0, |
| "validation_share_agent": false, |
| "metrics": "default", |
| "aggregate_micro": false, |
| "tensorboard_log": false, |
| "dict_maxexs": -1, |
| "dict_include_valid": false, |
| "dict_include_test": false, |
| "log_every_n_secs": 10.0, |
| "image_size": 256, |
| "image_cropsize": 224, |
| "label_type": "response", |
| "include_knowledge": true, |
| "include_checked_sentence": true, |
| "include_knowledge_separator": false, |
| "num_topics": 5, |
| "train_experiencer_only": false, |
| "remove_political_convos": false, |
| "embedding_size": 2560, |
| "n_layers": 2, |
| "ffn_size": 10240, |
| "dropout": 0.1, |
| "attention_dropout": 0.0, |
| "relu_dropout": 0.0, |
| "n_heads": 32, |
| "learn_positional_embeddings": false, |
| "embeddings_scale": true, |
| "n_positions": 128, |
| "n_segments": 0, |
| "variant": "prelayernorm", |
| "activation": "gelu", |
| "output_scaling": 1.0, |
| "share_word_embeddings": true, |
| "n_encoder_layers": 2, |
| "n_decoder_layers": 24, |
| "model_parallel": true, |
| "beam_size": 20, |
| "beam_min_length": 20, |
| "beam_context_block_ngram": 3, |
| "beam_block_ngram": 3, |
| "beam_length_penalty": 0.65, |
| "skip_generation": false, |
| "inference": "topk", |
| "topk": 40, |
| "topp": 0.9, |
| "beam_delay": 30, |
| "temperature": 1.0, |
| "compute_tokenized_bleu": false, |
| "embedding_type": "random", |
| "embedding_projection": "random", |
| "fp16": true, |
| "fp16_impl": "mem_efficient", |
| "force_fp16_tokens": true, |
| "optimizer": "mem_eff_adam", |
| "learningrate": 7e-06, |
| "gradient_clip": 0.1, |
| "adam_eps": 1e-08, |
| "adafactor_eps": [ |
| 1e-30, |
| 0.001 |
| ], |
| "momentum": 0, |
| "nesterov": true, |
| "nus": [ |
| 0.7 |
| ], |
| "betas": [ |
| 0.9, |
| 0.999 |
| ], |
| "weight_decay": null, |
| "rank_candidates": false, |
| "truncate": 128, |
| "text_truncate": 128, |
| "label_truncate": 128, |
| "history_size": -1, |
| "person_tokens": false, |
| "split_lines": false, |
| "use_reply": "label", |
| "add_p1_after_newln": false, |
| "delimiter": " ", |
| "history_add_global_end_token": "end", |
| "gpu": -1, |
| "no_cuda": false, |
| "dict_file": "ParlAI/data/models/blender/blender_3B/model.dict", |
| "dict_initpath": null, |
| "dict_language": "english", |
| "dict_max_ngram_size": -1, |
| "dict_minfreq": 0, |
| "dict_maxtokens": -1, |
| "dict_nulltoken": "__null__", |
| "dict_starttoken": "__start__", |
| "dict_endtoken": "__end__", |
| "dict_unktoken": "__unk__", |
| "dict_tokenizer": "bytelevelbpe", |
| "dict_lower": false, |
| "bpe_debug": false, |
| "dict_textfields": "text,labels", |
| "bpe_vocab": "ParlAI/data/models/blender/blender_3B/model.dict-vocab.json", |
| "bpe_merge": "ParlAI/data/models/blender/blender_3B/model.dict-merges.txt", |
| "bpe_add_prefix_space": true, |
| "lr_scheduler": "reduceonplateau", |
| "lr_scheduler_patience": 3, |
| "lr_scheduler_decay": 0.5, |
| "max_lr_steps": -1, |
| "invsqrt_lr_decay_gamma": -1, |
| "warmup_updates": 100, |
| "warmup_rate": 0.0001, |
| "update_freq": 2, |
| "parlai_home": "ParlAI/", |
| "starttime": "Mar31_06-04", |
| "beam_block_full_context": false, |
| "batchindex": 127, |
| "dict_loaded": true |
| } |
|
|