Spaces:
Running
Running
File size: 2,732 Bytes
85ab89d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 |
{ "run": { "task": "image_text_pretrain", "lr_sched": "linear_warmup_cosine_lr", "init_lr": 1e-05, "min_lr": 1e-06, "warmup_lr": 1e-06, "weight_decay": 0.05, "max_epoch": 10, "batch_size_train": 1, "batch_size_eval": 1, "num_workers": 12, "warmup_steps": 5000, "seed": 42, "output_dir": "ft/Llama-2-7b-chat-hf/", "amp": true, "resume_ckpt_path": null, "evaluate": false, "train_splits": [ "train" ], "device": "cuda", "world_size": 1, "dist_url": "env://", "distributed": true, "stage": 2, "rank": 0, "gpu": 0, "dist_backend": "nccl" }, "model": { "arch": "mini_gpt4", "image_size": 224, "drop_path_rate": 0, "use_grad_checkpoint": false, "vit_precision": "fp16", "freeze_vit": true, "freeze_qformer": true, "num_query_token": 32, "llama_model": "/home/ubuntu/ckpt/hf/Llama-2-7b-chat-hf/", "prompt": "", "model_type": "pretrain_vicuna", "max_txt_len": 256, "end_sym": "###", "prompt_template": "###Human: {} ###Assistant: ", "ckpt": "/home/ubuntu/proteinchat/minigpt4/output/Llama-2-7b-chat-hf/20240606005/checkpoint_2.pth" }, "preprocess": { "vis_processor": { "train": { "name": "blip2_image_train", "image_size": 224 }, "eval": { "name": "blip2_image_eval", "image_size": 224 } }, "text_processor": { "train": { "name": "blip_caption" }, "eval": { "name": "blip_caption" } } }, "datasets": { "cc_sbu_align": { "data_type": "images", "build_info": { "storage": "PATH_TO_$cc_sbu_align" }, "vis_processor": { "train": { "name": "blip2_image_train", "image_size": 224 } }, "text_processor": { "train": { "name": "blip_caption" } } } } } {"train_lr": "0.000", "train_loss": "1.280"} {"train_lr": "0.000", "train_loss": "0.805"} {"train_lr": "0.000", "train_loss": "0.756"} {"train_lr": "0.000", "train_loss": "0.727"} {"train_lr": "0.000", "train_loss": "0.704"} {"train_lr": "0.000", "train_loss": "0.682"} {"train_lr": "0.000", "train_loss": "0.664"} {"train_lr": "0.000", "train_loss": "0.648"} |