File size: 2,732 Bytes
85ab89d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
{
    "run": {
        "task": "image_text_pretrain",
        "lr_sched": "linear_warmup_cosine_lr",
        "init_lr": 1e-05,
        "min_lr": 1e-06,
        "warmup_lr": 1e-06,
        "weight_decay": 0.05,
        "max_epoch": 10,
        "batch_size_train": 1,
        "batch_size_eval": 1,
        "num_workers": 12,
        "warmup_steps": 5000,
        "seed": 42,
        "output_dir": "ft/Llama-2-7b-chat-hf/",
        "amp": true,
        "resume_ckpt_path": null,
        "evaluate": false,
        "train_splits": [
            "train"
        ],
        "device": "cuda",
        "world_size": 1,
        "dist_url": "env://",
        "distributed": true,
        "stage": 2,
        "rank": 0,
        "gpu": 0,
        "dist_backend": "nccl"
    },
    "model": {
        "arch": "mini_gpt4",
        "image_size": 224,
        "drop_path_rate": 0,
        "use_grad_checkpoint": false,
        "vit_precision": "fp16",
        "freeze_vit": true,
        "freeze_qformer": true,
        "num_query_token": 32,
        "llama_model": "/home/ubuntu/ckpt/hf/Llama-2-7b-chat-hf/",
        "prompt": "",
        "model_type": "pretrain_vicuna",
        "max_txt_len": 256,
        "end_sym": "###",
        "prompt_template": "###Human: {} ###Assistant: ",
        "ckpt": "/home/ubuntu/proteinchat/minigpt4/output/Llama-2-7b-chat-hf/20240606005/checkpoint_2.pth"
    },
    "preprocess": {
        "vis_processor": {
            "train": {
                "name": "blip2_image_train",
                "image_size": 224
            },
            "eval": {
                "name": "blip2_image_eval",
                "image_size": 224
            }
        },
        "text_processor": {
            "train": {
                "name": "blip_caption"
            },
            "eval": {
                "name": "blip_caption"
            }
        }
    },
    "datasets": {
        "cc_sbu_align": {
            "data_type": "images",
            "build_info": {
                "storage": "PATH_TO_$cc_sbu_align"
            },
            "vis_processor": {
                "train": {
                    "name": "blip2_image_train",
                    "image_size": 224
                }
            },
            "text_processor": {
                "train": {
                    "name": "blip_caption"
                }
            }
        }
    }
}
{"train_lr": "0.000", "train_loss": "1.280"}
{"train_lr": "0.000", "train_loss": "0.805"}
{"train_lr": "0.000", "train_loss": "0.756"}
{"train_lr": "0.000", "train_loss": "0.727"}
{"train_lr": "0.000", "train_loss": "0.704"}
{"train_lr": "0.000", "train_loss": "0.682"}
{"train_lr": "0.000", "train_loss": "0.664"}
{"train_lr": "0.000", "train_loss": "0.648"}