daje committed on
Commit
16fea24
·
1 Parent(s): da7217d

Upload model.opt

Browse files
Files changed (1) hide show
  1. model.opt +1 -0
model.opt ADDED
@@ -0,0 +1 @@
 
 
1
+ {"init_opt": null, "show_advanced_args": false, "task": "convai2", "download_path": "/private/home/edinan/ParlAI/downloads", "datatype": "train", "image_mode": "raw", "numthreads": 1, "hide_labels": false, "multitask_weights": [1], "batchsize": 2, "datapath": "/private/home/edinan/ParlAI/data", "model": "transformer/polyencoder", "model_file": "/private/home/edinan/ParlAI/data/models/pretrained_transformers/poly_model_huge_reddit.mdl", "init_model": null, "dict_class": "parlai.core.dict:DictionaryAgent", "local_human_candidates_file": null, "single_turn": false, "image_size": 256, "image_cropsize": 224, "embedding_type": "random", "embedding_projection": "random", "fp16": true, "optimizer": "adamax", "learningrate": 5e-05, "gradient_clip": 0.1, "momentum": 0, "nesterov": true, "nus": [0.7], "betas": [0.9, 0.999], "weight_decay": null, "lr_scheduler": "reduceonplateau", "lr_scheduler_patience": 0, "lr_scheduler_decay": 0.4, "warmup_updates": 100, "warmup_rate": 0.0001, "update_freq": 1, "rank_candidates": true, "truncate": 1024, "text_truncate": 360, "label_truncate": 72, "history_size": 20, "person_tokens": false, "split_lines": false, "use_reply": "label", "add_p1_after_newln": false, "delimiter": "\n", "gpu": -1, "no_cuda": false, "candidates": "batch", "eval_candidates": "inline", "repeat_blocking_heuristic": true, "fixed_candidates_path": null, "fixed_candidate_vecs": "reuse", "encode_candidate_vecs": false, "train_predict": false, "cap_num_predictions": 100, "ignore_bad_candidates": false, "embedding_size": 768, "n_layers": 12, "ffn_size": 3072, "dropout": 0.1, "attention_dropout": 0.1, "relu_dropout": 0.0, "n_heads": 12, "learn_positional_embeddings": true, "embeddings_scale": false, "n_positions": 1024, "n_segments": 2, "variant": "xlm", "activation": "gelu", "output_scaling": 0.06, "use_memories": false, "wrap_memory_encoder": false, "memory_attention": "sqrt", "normalize_sent_emb": false, "share_encoders": false, "share_word_embeddings": true, 
"learn_embeddings": true, "data_parallel": true, "reduction_type": "mean", "dict_file": "./data/models/pretrained_transformers/model_bi.dict", "dict_initpath": null, "dict_language": "english", "dict_max_ngram_size": -1, "dict_minfreq": 0, "dict_maxtokens": -1, "dict_nulltoken": "__null__", "dict_starttoken": "__start__", "dict_endtoken": "__start__", "dict_unktoken": "__unk__", "dict_tokenizer": "bpe", "dict_lower": true, "bpe_debug": false, "dict_textfields": "text,labels", "polyencoder_type": "n_first", "poly_n_codes": 64, "poly_attention_type": "basic", "poly_attention_num_heads": 4, "codes_attention_type": "basic", "codes_attention_num_heads": 4, "parlai_home": "/private/home/edinan/ParlAI", "override": {"model_file": "/private/home/edinan/ParlAI/data/models/pretrained_transformers/poly_model_huge_reddit.mdl", "dict_file": "./data/models/pretrained_transformers/model_bi.dict", "task": "convai2", "model": "transformer/polyencoder", "batchsize": 2, "lr_scheduler_patience": 0, "lr_scheduler_decay": 0.4, "learningrate": 5e-05, "data_parallel": true, "history_size": 20, "label_truncate": 72, "text_truncate": 360, "candidates": "batch", "fp16": true, "dict_tokenizer": "bpe", "dict_lower": true, "optimizer": "adamax", "output_scaling": 0.06, "variant": "xlm", "reduction_type": "mean", "share_encoders": false, "learn_positional_embeddings": true, "n_layers": 12, "n_heads": 12, "ffn_size": 3072, "attention_dropout": 0.1, "relu_dropout": 0.0, "dropout": 0.1, "n_positions": 1024, "embedding_size": 768, "activation": "gelu", "embeddings_scale": false, "n_segments": 2, "learn_embeddings": true, "polyencoder_type": "n_first", "poly_n_codes": 64, "poly_attention_type": "basic", "dict_endtoken": "__start__"}, "starttime": "Jul12_08-39"}