flant5-few-shottttt / config.json
cti-ttp-18's picture
Training in progress, epoch 1
b724545 verified
{
"_name_or_path": "google/flan-t5-base",
"architectures": [
"T5ForSequenceClassification"
],
"classifier_dropout": 0.0,
"d_ff": 2048,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "gelu_new",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "gated-gelu",
"id2label": {
"0": "t1497virtualization/sandboxevasion",
"1": "t1082systeminformationdiscovery",
"2": "t1059commandandscriptinginterpreter",
"3": "t1486dataencryptedforimpact",
"4": "t1105ingresstooltransfer",
"5": "t1021remoteservices",
"6": "t0814denialofservice",
"7": "t1562impairdefenses",
"8": "t1055processinjection",
"9": "t1566phishing",
"10": "t1003oscredentialdumping",
"11": "t1027obfuscatedfilesorinformation",
"12": "t1018remotesystemdiscovery",
"13": "t1047windowsmanagementinstrumentation",
"14": "t1053scheduledtask/job"
},
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": true,
"label2id": {
"t0814denialofservice": 6,
"t1003oscredentialdumping": 10,
"t1018remotesystemdiscovery": 12,
"t1021remoteservices": 5,
"t1027obfuscatedfilesorinformation": 11,
"t1047windowsmanagementinstrumentation": 13,
"t1053scheduledtask/job": 14,
"t1055processinjection": 8,
"t1059commandandscriptinginterpreter": 2,
"t1082systeminformationdiscovery": 1,
"t1105ingresstooltransfer": 4,
"t1486dataencryptedforimpact": 3,
"t1497virtualization/sandboxevasion": 0,
"t1562impairdefenses": 7,
"t1566phishing": 9
},
"layer_norm_epsilon": 1e-06,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"problem_type": "multi_label_classification",
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"tie_word_embeddings": false,
"torch_dtype": "float32",
"transformers_version": "4.39.2",
"use_cache": true,
"vocab_size": 32128
}