Zhang199 committed on
Commit
25e5e53
1 Parent(s): f5344d6

commit from

Browse files
added_tokens.json ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
1
+ {
2
+ "<|endoftext|>": 151643,
3
+ "<|im_end|>": 151645,
4
+ "<|im_start|>": 151644
5
+ }
config.json ADDED
@@ -0,0 +1,70 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "architectures": [
3
+ "TinyLlavaForConditionalGeneration"
4
+ ],
5
+ "cache_dir": null,
6
+ "connector_type": "mlp2x_gelu",
7
+ "hidden_size": 896,
8
+ "ignore_index": -100,
9
+ "image_aspect_ratio": "square",
10
+ "image_token_index": -200,
11
+ "llm_model_name_or_path": "Qwen/Qwen2-0.5B",
12
+ "model_type": "tinyllava",
13
+ "num_queries": 128,
14
+ "num_resampler_layers": 3,
15
+ "pad_token": "<|endoftext|>",
16
+ "pad_token_id": 151643,
17
+ "resampler_hidden_size": 768,
18
+ "text_config": {
19
+ "_name_or_path": "Qwen/Qwen2-0.5B",
20
+ "architectures": [
21
+ "Qwen2ForCausalLM"
22
+ ],
23
+ "bos_token_id": 151643,
24
+ "eos_token_id": 151643,
25
+ "hidden_size": 896,
26
+ "intermediate_size": 4864,
27
+ "max_position_embeddings": 131072,
28
+ "max_window_layers": 24,
29
+ "model_type": "qwen2",
30
+ "num_attention_heads": 14,
31
+ "num_hidden_layers": 24,
32
+ "num_key_value_heads": 2,
33
+ "rope_theta": 1000000.0,
34
+ "sliding_window": 131072,
35
+ "tie_word_embeddings": true,
36
+ "torch_dtype": "float16",
37
+ "use_sliding_window": false,
38
+ "vocab_size": 151936
39
+ },
40
+ "tokenizer_model_max_length": 2048,
41
+ "tokenizer_name_or_path": "Qwen/Qwen2-0.5B",
42
+ "tokenizer_padding_side": "right",
43
+ "tokenizer_use_fast": false,
44
+ "torch_dtype": "float16",
45
+ "transformers_version": "4.39.3",
46
+ "tune_type_connector": "full",
47
+ "tune_type_llm": "full",
48
+ "tune_type_vision_tower": "frozen",
49
+ "tune_vision_tower_from_layer": 0,
50
+ "use_cache": true,
51
+ "vision_config": {
52
+ "hidden_act": "gelu_pytorch_tanh",
53
+ "hidden_size": 1152,
54
+ "image_size": 384,
55
+ "intermediate_size": 4304,
56
+ "layer_norm_eps": 1e-06,
57
+ "model_name_or_path": "google/siglip-so400m-patch14-384",
58
+ "model_name_or_path2": "",
59
+ "model_type": "siglip_vision_model",
60
+ "num_attention_heads": 16,
61
+ "num_hidden_layers": 27,
62
+ "patch_size": 14
63
+ },
64
+ "vision_feature_layer": -2,
65
+ "vision_feature_select_strategy": "patch",
66
+ "vision_hidden_size": 1152,
67
+ "vision_model_name_or_path": "google/siglip-so400m-patch14-384",
68
+ "vision_model_name_or_path2": "",
69
+ "vocab_size": 151936
70
+ }
generation_config.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 151643,
4
+ "eos_token_id": 151643,
5
+ "transformers_version": "4.39.3",
6
+ "use_cache": false
7
+ }
log.txt ADDED
@@ -0,0 +1,77 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2024-07-16 15:40:33,688 | INFO: Total Parameters: 924095168, Total Trainable Parameters: 495869568
2
+ 2024-07-16 15:40:33,688 | INFO: Trainable Parameters:
3
+ 2024-07-16 15:40:33,695 | WARNING: Detected kernel version 3.10.0, which is below the recommended minimum of 5.5.0; this can cause the process to hang. It is recommended to upgrade the kernel to the minimum version or higher.
4
+ 2024-07-16 15:40:39,768 | INFO: Added key: store_based_barrier_key:2 to store for rank: 6
5
+ 2024-07-16 15:40:43,128 | INFO: Added key: store_based_barrier_key:2 to store for rank: 0
6
+ 2024-07-16 15:40:43,235 | INFO: Added key: store_based_barrier_key:2 to store for rank: 2
7
+ 2024-07-16 15:40:43,777 | INFO: Added key: store_based_barrier_key:2 to store for rank: 5
8
+ 2024-07-16 15:40:44,174 | INFO: Added key: store_based_barrier_key:2 to store for rank: 4
9
+ 2024-07-16 15:40:44,799 | INFO: Added key: store_based_barrier_key:2 to store for rank: 1
10
+ 2024-07-16 15:40:45,214 | INFO: Added key: store_based_barrier_key:2 to store for rank: 3
11
+ 2024-07-16 15:40:46,146 | INFO: Added key: store_based_barrier_key:2 to store for rank: 7
12
+ 2024-07-16 15:40:46,146 | INFO: Rank 7: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
13
+ 2024-07-16 15:40:46,149 | INFO: Rank 6: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
14
+ 2024-07-16 15:40:46,150 | INFO: Rank 0: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
15
+ 2024-07-16 15:40:46,152 | INFO: Rank 2: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
16
+ 2024-07-16 15:40:46,154 | INFO: Rank 5: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
17
+ 2024-07-16 15:40:46,155 | INFO: Rank 1: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
18
+ 2024-07-16 15:40:46,155 | INFO: Rank 3: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
19
+ 2024-07-16 15:40:46,155 | INFO: Rank 4: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
20
+ 2024-07-16 15:44:35,860 | INFO: Added key: store_based_barrier_key:2 to store for rank: 5
21
+ 2024-07-16 15:44:36,299 | INFO: Total Parameters: 924095168, Total Trainable Parameters: 495869568
22
+ 2024-07-16 15:44:36,299 | INFO: Trainable Parameters:
23
+ 2024-07-16 15:44:36,306 | WARNING: Detected kernel version 3.10.0, which is below the recommended minimum of 5.5.0; this can cause the process to hang. It is recommended to upgrade the kernel to the minimum version or higher.
24
+ 2024-07-16 15:44:39,116 | INFO: Added key: store_based_barrier_key:2 to store for rank: 2
25
+ 2024-07-16 15:44:43,212 | INFO: Added key: store_based_barrier_key:2 to store for rank: 1
26
+ 2024-07-16 15:44:43,924 | INFO: Added key: store_based_barrier_key:2 to store for rank: 7
27
+ 2024-07-16 15:44:43,926 | INFO: Added key: store_based_barrier_key:2 to store for rank: 3
28
+ 2024-07-16 15:44:44,783 | INFO: Added key: store_based_barrier_key:2 to store for rank: 6
29
+ 2024-07-16 15:44:45,226 | INFO: Added key: store_based_barrier_key:2 to store for rank: 0
30
+ 2024-07-16 15:44:45,864 | INFO: Waiting in store based barrier to initialize process group for rank: 5, key: store_based_barrier_key:2 (world_size=8, worker_count=7, timeout=0:30:00)
31
+ 2024-07-16 15:44:45,964 | INFO: Added key: store_based_barrier_key:2 to store for rank: 4
32
+ 2024-07-16 15:44:45,965 | INFO: Rank 4: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
33
+ 2024-07-16 15:44:45,965 | INFO: Rank 0: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
34
+ 2024-07-16 15:44:45,965 | INFO: Rank 2: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
35
+ 2024-07-16 15:44:45,965 | INFO: Rank 5: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
36
+ 2024-07-16 15:44:45,965 | INFO: Rank 6: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
37
+ 2024-07-16 15:44:45,967 | INFO: Rank 7: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
38
+ 2024-07-16 15:44:45,969 | INFO: Rank 3: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
39
+ 2024-07-16 15:44:45,971 | INFO: Rank 1: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
40
+ 2024-07-16 15:48:33,508 | INFO: Total Parameters: 924095168, Total Trainable Parameters: 495869568
41
+ 2024-07-16 15:48:33,508 | INFO: Trainable Parameters:
42
+ 2024-07-16 15:48:33,515 | WARNING: Detected kernel version 3.10.0, which is below the recommended minimum of 5.5.0; this can cause the process to hang. It is recommended to upgrade the kernel to the minimum version or higher.
43
+ 2024-07-16 15:48:40,753 | INFO: Added key: store_based_barrier_key:2 to store for rank: 2
44
+ 2024-07-16 15:48:42,601 | INFO: Added key: store_based_barrier_key:2 to store for rank: 1
45
+ 2024-07-16 15:48:43,084 | INFO: Added key: store_based_barrier_key:2 to store for rank: 0
46
+ 2024-07-16 15:48:43,546 | INFO: Added key: store_based_barrier_key:2 to store for rank: 6
47
+ 2024-07-16 15:48:43,832 | INFO: Added key: store_based_barrier_key:2 to store for rank: 7
48
+ 2024-07-16 15:48:43,948 | INFO: Added key: store_based_barrier_key:2 to store for rank: 4
49
+ 2024-07-16 15:48:44,337 | INFO: Added key: store_based_barrier_key:2 to store for rank: 5
50
+ 2024-07-16 15:48:44,821 | INFO: Added key: store_based_barrier_key:2 to store for rank: 3
51
+ 2024-07-16 15:48:44,821 | INFO: Rank 3: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
52
+ 2024-07-16 15:48:44,823 | INFO: Rank 5: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
53
+ 2024-07-16 15:48:44,823 | INFO: Rank 0: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
54
+ 2024-07-16 15:48:44,825 | INFO: Rank 7: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
55
+ 2024-07-16 15:48:44,828 | INFO: Rank 1: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
56
+ 2024-07-16 15:48:44,828 | INFO: Rank 2: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
57
+ 2024-07-16 15:48:44,829 | INFO: Rank 4: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
58
+ 2024-07-16 15:48:44,830 | INFO: Rank 6: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
59
+ 2024-07-16 15:51:35,846 | INFO: Total Parameters: 924095168, Total Trainable Parameters: 495869568
60
+ 2024-07-16 15:51:35,846 | INFO: Trainable Parameters:
61
+ 2024-07-16 15:51:35,852 | WARNING: Detected kernel version 3.10.0, which is below the recommended minimum of 5.5.0; this can cause the process to hang. It is recommended to upgrade the kernel to the minimum version or higher.
62
+ 2024-07-16 15:51:40,320 | INFO: Added key: store_based_barrier_key:2 to store for rank: 3
63
+ 2024-07-16 15:51:43,850 | INFO: Added key: store_based_barrier_key:2 to store for rank: 5
64
+ 2024-07-16 15:51:44,522 | INFO: Added key: store_based_barrier_key:2 to store for rank: 6
65
+ 2024-07-16 15:51:44,688 | INFO: Added key: store_based_barrier_key:2 to store for rank: 7
66
+ 2024-07-16 15:51:45,242 | INFO: Added key: store_based_barrier_key:2 to store for rank: 0
67
+ 2024-07-16 15:51:45,726 | INFO: Added key: store_based_barrier_key:2 to store for rank: 4
68
+ 2024-07-16 15:51:45,814 | INFO: Added key: store_based_barrier_key:2 to store for rank: 1
69
+ 2024-07-16 15:51:46,384 | INFO: Added key: store_based_barrier_key:2 to store for rank: 2
70
+ 2024-07-16 15:51:46,385 | INFO: Rank 2: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
71
+ 2024-07-16 15:51:46,386 | INFO: Rank 5: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
72
+ 2024-07-16 15:51:46,387 | INFO: Rank 7: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
73
+ 2024-07-16 15:51:46,387 | INFO: Rank 3: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
74
+ 2024-07-16 15:51:46,391 | INFO: Rank 1: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
75
+ 2024-07-16 15:51:46,394 | INFO: Rank 4: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
76
+ 2024-07-16 15:51:46,394 | INFO: Rank 6: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
77
+ 2024-07-16 15:51:46,394 | INFO: Rank 0: Completed store-based barrier for key:store_based_barrier_key:2 with 8 nodes.
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85811ad4c281f9aa849b0512c6bc78fb5467ee0c905d27ee95a2bbe3353ad4f4
3
+ size 2120564264
runs/Jul16_15-39-14_gpu21.buaanlsde.org/events.out.tfevents.1721115660.gpu21.buaanlsde.org ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf13ea6871157ed35533451877d7b478085f0b9e27242d2600ba732d740ee249
3
+ size 7943
runs/Jul16_15-43-12_gpu21.buaanlsde.org/events.out.tfevents.1721115898.gpu21.buaanlsde.org ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbae5a63c3cceac151462221ee2374005032d789d042820b614b56216265652f
3
+ size 6908
runs/Jul16_15-47-12_gpu21.buaanlsde.org/events.out.tfevents.1721116137.gpu21.buaanlsde.org ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a1b4a7febcf797bcd94f2a947d3cb9bb1cd36ceb304b8f7abfc53e0f8890eba
3
+ size 6908
runs/Jul16_15-50-09_gpu21.buaanlsde.org/events.out.tfevents.1721116320.gpu21.buaanlsde.org ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:72706bf3d0c2f48b05e8f53bcf6664d14a8e2e76248aa133d596f84d963c209f
3
+ size 554725
special_tokens_map.json ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "additional_special_tokens": [
3
+ "<|im_start|>",
4
+ "<|im_end|>"
5
+ ],
6
+ "eos_token": {
7
+ "content": "<|endoftext|>",
8
+ "lstrip": false,
9
+ "normalized": false,
10
+ "rstrip": false,
11
+ "single_word": false
12
+ },
13
+ "pad_token": {
14
+ "content": "<|endoftext|>",
15
+ "lstrip": false,
16
+ "normalized": false,
17
+ "rstrip": false,
18
+ "single_word": false
19
+ },
20
+ "unk_token": "<|endoftext|>"
21
+ }
tokenizer_config.json ADDED
@@ -0,0 +1,44 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_prefix_space": false,
3
+ "added_tokens_decoder": {
4
+ "151643": {
5
+ "content": "<|endoftext|>",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "151644": {
13
+ "content": "<|im_start|>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ },
20
+ "151645": {
21
+ "content": "<|im_end|>",
22
+ "lstrip": false,
23
+ "normalized": false,
24
+ "rstrip": false,
25
+ "single_word": false,
26
+ "special": true
27
+ }
28
+ },
29
+ "additional_special_tokens": [
30
+ "<|im_start|>",
31
+ "<|im_end|>"
32
+ ],
33
+ "bos_token": null,
34
+ "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
35
+ "clean_up_tokenization_spaces": false,
36
+ "eos_token": "<|endoftext|>",
37
+ "errors": "replace",
38
+ "model_max_length": 2048,
39
+ "pad_token": "<|endoftext|>",
40
+ "padding_side": "right",
41
+ "split_special_tokens": false,
42
+ "tokenizer_class": "Qwen2Tokenizer",
43
+ "unk_token": "<|endoftext|>"
44
+ }
trainer_state.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26f14cea7e53ec20e7d8c0842f5f70351446be1f1e62fd03fb6e3e287e4dbbd7
3
+ size 6459
vocab.json ADDED
The diff for this file is too large to render. See raw diff