|
[ |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 10:46:19", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 32.29472152392069, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 14.563165505727133 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 10:48:55", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 67.97515447934468, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 33.00641902287801 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 10:48:58", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1440, |
|
"summarize_time": 114.62220064798991, |
|
"generate_output_len_bytes": 2619, |
|
"generate_time": 71.0722058614095 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 10:58:34", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 866, |
|
"summarize_time": 39.54404203097025, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 22.466302394866943 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:01:59", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 32.1394579410553, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 14.757195552190145 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 10:54:29", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 910, |
|
"summarize_time": 185.14580019315085, |
|
"generate_output_len_bytes": 2042, |
|
"generate_time": 117.13909141222636 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:04:37", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 94.98129558563232, |
|
"generate_output_len_bytes": 2512, |
|
"generate_time": 69.4871145884196 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:13:08", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1276, |
|
"summarize_time": 43.23498781522115, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 22.826789538065594 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 11:10:08", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 991, |
|
"summarize_time": 90.51939169565837, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 48.96095744768778 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 11:16:48", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 31.86189842224121, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 14.209659894307455 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:17:39", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 71.48081835110982, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 33.5740262667338 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 11:19:24", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 94.17744310696919, |
|
"generate_output_len_bytes": 2512, |
|
"generate_time": 70.12592967351277 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 11:27:57", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1276, |
|
"summarize_time": 42.8066500822703, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 22.626200040181477 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:23:22", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 910, |
|
"summarize_time": 186.88371555010477, |
|
"generate_output_len_bytes": 2042, |
|
"generate_time": 117.3530724843343 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 11:39:03", |
|
"git_sha": "55d3b55b", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 991, |
|
"summarize_time": 94.50985678037007, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 50.06416177749634 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 21:08:31", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 38.80374129613241, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 19.23690136273702 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 21:11:49", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 178.79640992482504, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 93.99476226170857 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 21:25:53", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 53.44271365801493, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 30.641155401865642 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 21:30:30", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 40.80062770843506, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 19.825008392333984 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 21:35:29", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 177.35046529769897, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 91.73111907641093 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 21:49:20", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 56.894784371058144, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 32.15500020980835 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/18/2023 21:54:11", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 41.46419604619344, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 20.049855709075928 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/18/2023 21:57:39", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 183.73364853858948, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 94.9052836894989 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/18/2023 22:11:59", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 59.204413731892906, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 33.25332593917847 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/18/2023 22:17:00", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 42.09002653757731, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 20.106103817621868 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/18/2023 22:20:31", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 185.28164370854697, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 95.13023789723714 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/18/2023 22:34:58", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 60.9919019540151, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 34.328625202178955 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:31:34", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 52.49842747052511, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 20.686774571736652 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:31:55", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:35:38", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1007, |
|
"summarize_time": 168.9666860898336, |
|
"generate_output_len_bytes": 2249, |
|
"generate_time": 73.25518870353699 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:48:09", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 856, |
|
"summarize_time": 45.30513469378153, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 22.000216643015545 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 13:51:56", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 51.64275654157003, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 20.737667481104534 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:35:47", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 980, |
|
"summarize_time": 280.4669913450877, |
|
"generate_output_len_bytes": 2132, |
|
"generate_time": 141.7793349424998 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 13:57:35", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 869, |
|
"summarize_time": 96.61887431144714, |
|
"generate_output_len_bytes": 3244, |
|
"generate_time": 82.98751719792683 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 13:55:51", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1007, |
|
"summarize_time": 167.52292919158936, |
|
"generate_output_len_bytes": 2249, |
|
"generate_time": 71.82611886660258 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 14:08:08", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 856, |
|
"summarize_time": 47.14254776636759, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 22.54850967725118 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 14:15:15", |
|
"git_sha": "d13230ee", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 14:07:15", |
|
"git_sha": "fc4826f2", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 89.59958203633626, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 42.32424934705099 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 14:15:30", |
|
"git_sha": "d13230ee", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1024, |
|
"summarize_time": 185.44230167071024, |
|
"generate_output_len_bytes": 2122, |
|
"generate_time": 88.11553311347961 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 14:29:36", |
|
"git_sha": "d13230ee", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 922, |
|
"summarize_time": 68.06459252039592, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 27.939613421758015 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 14:26:29", |
|
"git_sha": "d13230ee", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 980, |
|
"summarize_time": 280.8310640652974, |
|
"generate_output_len_bytes": 2132, |
|
"generate_time": 143.21916349728903 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 14:48:17", |
|
"git_sha": "d13230ee", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 869, |
|
"summarize_time": 98.47045453389485, |
|
"generate_output_len_bytes": 3244, |
|
"generate_time": 83.71360301971436 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 15:35:13", |
|
"git_sha": "0dec0f52", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 15:49:33", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 16:26:53", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 16:27:32", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 16:29:03", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 17:26:02", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 18:59:16", |
|
"git_sha": "5691db4a", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1075, |
|
"summarize_time": 39.01545596122742, |
|
"generate_output_len_bytes": 2242, |
|
"generate_time": 10.151424566904703 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 19:03:13", |
|
"git_sha": "5691db4a", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 940, |
|
"summarize_time": 21.78233750661214, |
|
"generate_output_len_bytes": 2130, |
|
"generate_time": 15.794983307520548 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 19:38:40", |
|
"git_sha": "6f05e8f1", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1114, |
|
"summarize_time": 7.636120955149333, |
|
"generate_output_len_bytes": 2275, |
|
"generate_time": 7.922623078028361 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 19:41:02", |
|
"git_sha": "6f05e8f1", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1024, |
|
"summarize_time": 10.824170271555582, |
|
"generate_output_len_bytes": 2130, |
|
"generate_time": 9.209020694096884 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 19:55:17", |
|
"git_sha": "2c548f21", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1088, |
|
"summarize_time": 24.39883820215861, |
|
"generate_output_len_bytes": 2275, |
|
"generate_time": 12.755743900934855 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 00:57:21", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 37.113919814427696, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 18.36507821083069 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:00:31", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 49.79721482594808, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 21.780913591384888 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:04:36", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:05:26", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 181.2461258570353, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 92.64811905225118 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:19:33", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 800, |
|
"summarize_time": 174.4576851526896, |
|
"generate_output_len_bytes": 2713, |
|
"generate_time": 119.14412077267964 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:36:14", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 53.39731526374817, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 31.369641542434692 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:40:53", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 74.27096923192342, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 29.860486666361492 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 01:48:09", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 39.926851193110146, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 18.481745958328247 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 01:51:27", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 51.299002488454185, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 21.828503131866455 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 01:56:20", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 178.19972308476767, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 91.73426882425944 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 02:10:13", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 800, |
|
"summarize_time": 180.7814578215281, |
|
"generate_output_len_bytes": 2713, |
|
"generate_time": 124.72717420260112 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 02:26:43", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 57.08081785837809, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 32.26534946759542 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 02:31:36", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 79.9461121559143, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 31.403561115264893 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 02:38:23", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 42.33977222442627, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 19.723278522491455 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 02:41:52", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 55.377869288126625, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 25.01458676656087 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 02:47:05", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 180.53432401021323, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 91.93375285466512 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:01:07", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 800, |
|
"summarize_time": 179.50477250417075, |
|
"generate_output_len_bytes": 2713, |
|
"generate_time": 124.40728378295898 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:17:36", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 58.62867816289266, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 33.394495725631714 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:22:37", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 78.90612125396729, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 30.697617371877033 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 03:29:20", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 40.498607873916626, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 19.509677171707153 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 03:32:44", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 55.3964786529541, |
|
"generate_output_len_bytes": 2172, |
|
"generate_time": 24.347585439682007 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 03:37:55", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1179, |
|
"summarize_time": 186.71331850687662, |
|
"generate_output_len_bytes": 2772, |
|
"generate_time": 95.784650405248 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 03:52:28", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 800, |
|
"summarize_time": 185.3280005455017, |
|
"generate_output_len_bytes": 2713, |
|
"generate_time": 125.91738017400105 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 04:09:18", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1002, |
|
"summarize_time": 60.18280680974325, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 33.386961142222084 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/19/2023 04:14:25", |
|
"git_sha": "a227be4f", |
|
"n_gpus": 8, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 83.04790727297465, |
|
"generate_output_len_bytes": 1802, |
|
"generate_time": 32.24992283185323 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 23:26:19", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 47.03754989306132, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 19.964784463246662 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 23:33:09", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 71.91136892636617, |
|
"generate_output_len_bytes": 2480, |
|
"generate_time": 33.6295014222463 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 23:44:08", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 00:45:42", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1007, |
|
"summarize_time": 148.61560583114624, |
|
"generate_output_len_bytes": 2357, |
|
"generate_time": 89.01266026496887 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 00:58:00", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 763, |
|
"summarize_time": 193.99270629882812, |
|
"generate_output_len_bytes": 2129, |
|
"generate_time": 95.66660761833191 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:13:01", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:13:55", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 991, |
|
"summarize_time": 61.52411222457886, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 32.030215660730995 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 01:19:00", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 1, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 81.13888708750407, |
|
"generate_output_len_bytes": 3486, |
|
"generate_time": 55.5331826210022 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 01:27:49", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 47.41046245892843, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 20.660600344340008 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 01:34:28", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 72.85646979014079, |
|
"generate_output_len_bytes": 2480, |
|
"generate_time": 34.05861854553223 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 02:39:22", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1007, |
|
"summarize_time": 152.54357608159384, |
|
"generate_output_len_bytes": 2357, |
|
"generate_time": 91.51808977127075 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 02:52:58", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 763, |
|
"summarize_time": 195.92926557858786, |
|
"generate_output_len_bytes": 2129, |
|
"generate_time": 96.55542047818501 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 03:15:01", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 991, |
|
"summarize_time": 64.64422671000163, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 33.30378039677938 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 03:20:19", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 2, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 84.57761120796204, |
|
"generate_output_len_bytes": 3486, |
|
"generate_time": 57.59072462717692 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:28:44", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1417, |
|
"summarize_time": 49.08898218472799, |
|
"generate_output_len_bytes": 2384, |
|
"generate_time": 21.489527861277264 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:32:39", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 74.43774898846944, |
|
"generate_output_len_bytes": 2480, |
|
"generate_time": 34.72673638661703 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:39:21", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1007, |
|
"summarize_time": 153.41076453526816, |
|
"generate_output_len_bytes": 2357, |
|
"generate_time": 91.14894040425618 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 03:52:00", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 763, |
|
"summarize_time": 199.79869039853415, |
|
"generate_output_len_bytes": 2129, |
|
"generate_time": 98.61504419644673 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 04:08:12", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 991, |
|
"summarize_time": 66.49260465304057, |
|
"generate_output_len_bytes": 2927, |
|
"generate_time": 34.17951035499573 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 04:13:39", |
|
"git_sha": "0cdb75ef", |
|
"n_gpus": 4, |
|
"transformers": "4.30.2", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1000, |
|
"summarize_time": 87.65787092844646, |
|
"generate_output_len_bytes": 3486, |
|
"generate_time": 59.3750696182251 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 22:22:24", |
|
"git_sha": "b63768c6", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 948, |
|
"summarize_time": 122.13213857014973, |
|
"generate_output_len_bytes": 2826, |
|
"generate_time": 66.34098903338115 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/18/2023 22:33:33", |
|
"git_sha": "c1348fb3", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 948, |
|
"summarize_time": 120.53812781969707, |
|
"generate_output_len_bytes": 2826, |
|
"generate_time": 67.28052496910095 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 22:56:52", |
|
"git_sha": "fb84de76", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1036, |
|
"summarize_time": 29.128981749216717, |
|
"generate_output_len_bytes": 2242, |
|
"generate_time": 12.197122732798258 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/18/2023 23:00:33", |
|
"git_sha": "fb84de76", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 05:47:43", |
|
"git_sha": "22352acd", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 05:48:58", |
|
"git_sha": "22352acd", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/19/2023 05:50:40", |
|
"git_sha": "22352acd", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 948, |
|
"summarize_time": 165.05752809842429, |
|
"generate_output_len_bytes": 2605, |
|
"generate_time": 93.80659619967143 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 06:05:51", |
|
"git_sha": "22352acd", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 06:10:05", |
|
"git_sha": "22352acd", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 906, |
|
"summarize_time": 410.0691332022349, |
|
"generate_output_len_bytes": 521, |
|
"generate_time": 57.71272214253744 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 06:36:58", |
|
"git_sha": "22352acd", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 948, |
|
"summarize_time": 171.74388321240744, |
|
"generate_output_len_bytes": 2605, |
|
"generate_time": 97.00725762049358 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 06:51:13", |
|
"git_sha": "22352acd", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 792, |
|
"summarize_time": 267.0555826822917, |
|
"generate_output_len_bytes": 2783, |
|
"generate_time": 163.99818523724875 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 07:13:35", |
|
"git_sha": "22352acd", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 906, |
|
"summarize_time": 413.9569679101308, |
|
"generate_output_len_bytes": 521, |
|
"generate_time": 58.52583885192871 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/19/2023 07:38:02", |
|
"git_sha": "22352acd", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 948, |
|
"summarize_time": 175.4907926718394, |
|
"generate_output_len_bytes": 2605, |
|
"generate_time": 98.97720170021057 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/19/2023 12:35:08", |
|
"git_sha": "29a002e5", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "timemachine", |
|
"gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 983, |
|
"summarize_time": 42.21107586224874, |
|
"generate_output_len_bytes": 2130, |
|
"generate_time": 16.94527777036031 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/21/2023 20:03:36", |
|
"git_sha": "51318f44", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 41.0461368560791, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 19.614749511082966 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 20:07:35", |
|
"git_sha": "51318f44", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 42.8376894791921, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 20.2719091574351 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/21/2023 20:42:46", |
|
"git_sha": "2f4bb620", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 20:50:19", |
|
"git_sha": "2f4bb620", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 66.52468911806743, |
|
"generate_output_len_bytes": 2479, |
|
"generate_time": 29.828714847564697 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 20:56:04", |
|
"git_sha": "2f4bb620", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", |
|
"exception": "OOM" |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/21/2023 19:55:35", |
|
"git_sha": "51318f44", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 38.753786404927574, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 19.529522736867268 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/21/2023 20:36:13", |
|
"git_sha": "51318f44", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 41.024452924728394, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 20.29120985666911 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/21/2023 20:40:08", |
|
"git_sha": "51318f44", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 54.554532527923584, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 24.604793945948284 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 20:50:05", |
|
"git_sha": "51318f44", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 41.09950613975525, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 20.947362899780273 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 20:54:08", |
|
"git_sha": "51318f44", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 58.3172922929128, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 25.735217014948528 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/21/2023 21:01:04", |
|
"git_sha": "51318f44", |
|
"n_gpus": 8, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 42.85940829912821, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 21.380353291829426 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/21/2023 21:05:24", |
|
"git_sha": "51318f44", |
|
"n_gpus": 8, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 54.235164642333984, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 25.70338026682536 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/21/2023 21:10:37", |
|
"git_sha": "51318f44", |
|
"n_gpus": 8, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 927, |
|
"summarize_time": 133.53030570348105, |
|
"generate_output_len_bytes": 2782, |
|
"generate_time": 72.97924383481343 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 22:18:17", |
|
"git_sha": "51318f44", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 927, |
|
"summarize_time": 131.45291074117026, |
|
"generate_output_len_bytes": 2782, |
|
"generate_time": 72.30849742889404 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/21/2023 22:51:09", |
|
"git_sha": "383b6bbc", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 39.269713958104454, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 19.65731406211853 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/21/2023 22:54:54", |
|
"git_sha": "383b6bbc", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 51.84283971786499, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 28.441521485646565 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/21/2023 23:13:10", |
|
"git_sha": "383b6bbc", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 53.383726040522255, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 24.422890504201252 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 4, |
|
"reps": 3, |
|
"date": "08/21/2023 23:18:04", |
|
"git_sha": "383b6bbc", |
|
"n_gpus": 4, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 52.791220347086586, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 25.378511508305866 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 8, |
|
"reps": 3, |
|
"date": "08/21/2023 23:23:11", |
|
"git_sha": "383b6bbc", |
|
"n_gpus": 8, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.8", |
|
"hostname": "cloudvm", |
|
"gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1046, |
|
"summarize_time": 56.3846542040507, |
|
"generate_output_len_bytes": 2171, |
|
"generate_time": 26.636192480723064 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 1, |
|
"reps": 3, |
|
"date": "08/21/2023 23:52:44", |
|
"git_sha": "da69b822", |
|
"n_gpus": 1, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1267, |
|
"summarize_time": 40.36223220825195, |
|
"generate_output_len_bytes": 2383, |
|
"generate_time": 19.87660264968872 |
|
}, |
|
{ |
|
"backend": "text-generation-inference", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 2, |
|
"reps": 3, |
|
"date": "08/22/2023 00:15:05", |
|
"git_sha": "e843e8c3", |
|
"n_gpus": 2, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "recypabaszmhhmuae", |
|
"gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 915, |
|
"summarize_time": 64.78201874097188, |
|
"generate_output_len_bytes": 2479, |
|
"generate_time": 29.02147897084554 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 16, |
|
"ngpus": 0, |
|
"reps": 3, |
|
"date": "08/22/2023 19:01:15", |
|
"git_sha": "855b7d15", |
|
"n_gpus": 0, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "CPU", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1351, |
|
"summarize_time": 1215.5185990333557, |
|
"generate_output_len_bytes": 849, |
|
"generate_time": 180.56836318969727 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 8, |
|
"ngpus": 0, |
|
"reps": 3, |
|
"date": "08/22/2023 20:11:16", |
|
"git_sha": "855b7d15", |
|
"n_gpus": 0, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "CPU", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1353, |
|
"summarize_time": 1216.9783231417339, |
|
"generate_output_len_bytes": 849, |
|
"generate_time": 180.42225472132364 |
|
}, |
|
{ |
|
"backend": "transformers", |
|
"base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", |
|
"task": "summary_and_generate", |
|
"bits": 4, |
|
"ngpus": 0, |
|
"reps": 3, |
|
"date": "08/22/2023 21:21:20", |
|
"git_sha": "855b7d15", |
|
"n_gpus": 0, |
|
"transformers": "4.31.0", |
|
"bitsandbytes": "0.41.1", |
|
"cuda": "11.7", |
|
"hostname": "rippa", |
|
"gpus": "CPU", |
|
"summarize_input_len_bytes": 857252, |
|
"summarize_output_len_bytes": 1354, |
|
"summarize_time": 1217.1687794526417, |
|
"generate_output_len_bytes": 843, |
|
"generate_time": 180.78463260332742 |
|
} |
|
] |
|
|