| [ | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 10:46:19", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 32.29472152392069, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 14.563165505727133 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 10:48:55", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 67.97515447934468, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 33.00641902287801 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 10:48:58", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1440, | |
| "summarize_time": 114.62220064798991, | |
| "generate_output_len_bytes": 2619, | |
| "generate_time": 71.0722058614095 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 10:58:34", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 866, | |
| "summarize_time": 39.54404203097025, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 22.466302394866943 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:01:59", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 32.1394579410553, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 14.757195552190145 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 10:54:29", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 910, | |
| "summarize_time": 185.14580019315085, | |
| "generate_output_len_bytes": 2042, | |
| "generate_time": 117.13909141222636 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:04:37", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 94.98129558563232, | |
| "generate_output_len_bytes": 2512, | |
| "generate_time": 69.4871145884196 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:13:08", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1276, | |
| "summarize_time": 43.23498781522115, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 22.826789538065594 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 11:10:08", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 991, | |
| "summarize_time": 90.51939169565837, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 48.96095744768778 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 11:16:48", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 31.86189842224121, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 14.209659894307455 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:17:39", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 71.48081835110982, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 33.5740262667338 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 11:19:24", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 94.17744310696919, | |
| "generate_output_len_bytes": 2512, | |
| "generate_time": 70.12592967351277 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 11:27:57", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1276, | |
| "summarize_time": 42.8066500822703, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 22.626200040181477 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:23:22", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 910, | |
| "summarize_time": 186.88371555010477, | |
| "generate_output_len_bytes": 2042, | |
| "generate_time": 117.3530724843343 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 11:39:03", | |
| "git_sha": "55d3b55b", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 991, | |
| "summarize_time": 94.50985678037007, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 50.06416177749634 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 21:08:31", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 38.80374129613241, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 19.23690136273702 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 21:11:49", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 178.79640992482504, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 93.99476226170857 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 21:25:53", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 53.44271365801493, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 30.641155401865642 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 21:30:30", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 40.80062770843506, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 19.825008392333984 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 21:35:29", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 177.35046529769897, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 91.73111907641093 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 21:49:20", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 56.894784371058144, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 32.15500020980835 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/18/2023 21:54:11", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 41.46419604619344, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 20.049855709075928 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/18/2023 21:57:39", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 183.73364853858948, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 94.9052836894989 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/18/2023 22:11:59", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 59.204413731892906, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 33.25332593917847 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/18/2023 22:17:00", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 42.09002653757731, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 20.106103817621868 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/18/2023 22:20:31", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 185.28164370854697, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 95.13023789723714 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/18/2023 22:34:58", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 60.9919019540151, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 34.328625202178955 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:31:34", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 52.49842747052511, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 20.686774571736652 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:31:55", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:35:38", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1007, | |
| "summarize_time": 168.9666860898336, | |
| "generate_output_len_bytes": 2249, | |
| "generate_time": 73.25518870353699 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:48:09", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 856, | |
| "summarize_time": 45.30513469378153, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 22.000216643015545 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 13:51:56", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 51.64275654157003, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 20.737667481104534 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:35:47", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 980, | |
| "summarize_time": 280.4669913450877, | |
| "generate_output_len_bytes": 2132, | |
| "generate_time": 141.7793349424998 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 13:57:35", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 869, | |
| "summarize_time": 96.61887431144714, | |
| "generate_output_len_bytes": 3244, | |
| "generate_time": 82.98751719792683 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 13:55:51", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1007, | |
| "summarize_time": 167.52292919158936, | |
| "generate_output_len_bytes": 2249, | |
| "generate_time": 71.82611886660258 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 14:08:08", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 856, | |
| "summarize_time": 47.14254776636759, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 22.54850967725118 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 14:15:15", | |
| "git_sha": "d13230ee", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 14:07:15", | |
| "git_sha": "fc4826f2", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 89.59958203633626, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 42.32424934705099 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 14:15:30", | |
| "git_sha": "d13230ee", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1024, | |
| "summarize_time": 185.44230167071024, | |
| "generate_output_len_bytes": 2122, | |
| "generate_time": 88.11553311347961 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 14:29:36", | |
| "git_sha": "d13230ee", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 922, | |
| "summarize_time": 68.06459252039592, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 27.939613421758015 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 14:26:29", | |
| "git_sha": "d13230ee", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 980, | |
| "summarize_time": 280.8310640652974, | |
| "generate_output_len_bytes": 2132, | |
| "generate_time": 143.21916349728903 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 14:48:17", | |
| "git_sha": "d13230ee", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 869, | |
| "summarize_time": 98.47045453389485, | |
| "generate_output_len_bytes": 3244, | |
| "generate_time": 83.71360301971436 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 15:35:13", | |
| "git_sha": "0dec0f52", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 15:49:33", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 16:26:53", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 16:27:32", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 16:29:03", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 17:26:02", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 18:59:16", | |
| "git_sha": "5691db4a", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1075, | |
| "summarize_time": 39.01545596122742, | |
| "generate_output_len_bytes": 2242, | |
| "generate_time": 10.151424566904703 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 19:03:13", | |
| "git_sha": "5691db4a", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 940, | |
| "summarize_time": 21.78233750661214, | |
| "generate_output_len_bytes": 2130, | |
| "generate_time": 15.794983307520548 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 19:38:40", | |
| "git_sha": "6f05e8f1", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1114, | |
| "summarize_time": 7.636120955149333, | |
| "generate_output_len_bytes": 2275, | |
| "generate_time": 7.922623078028361 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 19:41:02", | |
| "git_sha": "6f05e8f1", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1024, | |
| "summarize_time": 10.824170271555582, | |
| "generate_output_len_bytes": 2130, | |
| "generate_time": 9.209020694096884 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 19:55:17", | |
| "git_sha": "2c548f21", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA GeForce RTX 4090 (24564 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1088, | |
| "summarize_time": 24.39883820215861, | |
| "generate_output_len_bytes": 2275, | |
| "generate_time": 12.755743900934855 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 00:57:21", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 37.113919814427696, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 18.36507821083069 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:00:31", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 49.79721482594808, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 21.780913591384888 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:04:36", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:05:26", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 181.2461258570353, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 92.64811905225118 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:19:33", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 800, | |
| "summarize_time": 174.4576851526896, | |
| "generate_output_len_bytes": 2713, | |
| "generate_time": 119.14412077267964 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:36:14", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 53.39731526374817, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 31.369641542434692 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:40:53", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 74.27096923192342, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 29.860486666361492 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 01:48:09", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 39.926851193110146, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 18.481745958328247 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 01:51:27", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 51.299002488454185, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 21.828503131866455 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 01:56:20", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 178.19972308476767, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 91.73426882425944 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 02:10:13", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 800, | |
| "summarize_time": 180.7814578215281, | |
| "generate_output_len_bytes": 2713, | |
| "generate_time": 124.72717420260112 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 02:26:43", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 57.08081785837809, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 32.26534946759542 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 02:31:36", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 79.9461121559143, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 31.403561115264893 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 02:38:23", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 42.33977222442627, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 19.723278522491455 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 02:41:52", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 55.377869288126625, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 25.01458676656087 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 02:47:05", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 180.53432401021323, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 91.93375285466512 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:01:07", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 800, | |
| "summarize_time": 179.50477250417075, | |
| "generate_output_len_bytes": 2713, | |
| "generate_time": 124.40728378295898 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:17:36", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 58.62867816289266, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 33.394495725631714 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:22:37", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 78.90612125396729, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 30.697617371877033 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 03:29:20", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 40.498607873916626, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 19.509677171707153 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 03:32:44", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 55.3964786529541, | |
| "generate_output_len_bytes": 2172, | |
| "generate_time": 24.347585439682007 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 03:37:55", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1179, | |
| "summarize_time": 186.71331850687662, | |
| "generate_output_len_bytes": 2772, | |
| "generate_time": 95.784650405248 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 03:52:28", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 800, | |
| "summarize_time": 185.3280005455017, | |
| "generate_output_len_bytes": 2713, | |
| "generate_time": 125.91738017400105 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 04:09:18", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1002, | |
| "summarize_time": 60.18280680974325, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 33.386961142222084 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/19/2023 04:14:25", | |
| "git_sha": "a227be4f", | |
| "n_gpus": 8, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 83.04790727297465, | |
| "generate_output_len_bytes": 1802, | |
| "generate_time": 32.24992283185323 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 23:26:19", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 47.03754989306132, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 19.964784463246662 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 23:33:09", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 71.91136892636617, | |
| "generate_output_len_bytes": 2480, | |
| "generate_time": 33.6295014222463 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 23:44:08", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 00:45:42", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1007, | |
| "summarize_time": 148.61560583114624, | |
| "generate_output_len_bytes": 2357, | |
| "generate_time": 89.01266026496887 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 00:58:00", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 763, | |
| "summarize_time": 193.99270629882812, | |
| "generate_output_len_bytes": 2129, | |
| "generate_time": 95.66660761833191 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:13:01", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:13:55", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 991, | |
| "summarize_time": 61.52411222457886, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 32.030215660730995 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 01:19:00", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 1, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 81.13888708750407, | |
| "generate_output_len_bytes": 3486, | |
| "generate_time": 55.5331826210022 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 01:27:49", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 47.41046245892843, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 20.660600344340008 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 01:34:28", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 72.85646979014079, | |
| "generate_output_len_bytes": 2480, | |
| "generate_time": 34.05861854553223 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 02:39:22", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1007, | |
| "summarize_time": 152.54357608159384, | |
| "generate_output_len_bytes": 2357, | |
| "generate_time": 91.51808977127075 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 02:52:58", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 763, | |
| "summarize_time": 195.92926557858786, | |
| "generate_output_len_bytes": 2129, | |
| "generate_time": 96.55542047818501 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 03:15:01", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 991, | |
| "summarize_time": 64.64422671000163, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 33.30378039677938 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 03:20:19", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 2, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 84.57761120796204, | |
| "generate_output_len_bytes": 3486, | |
| "generate_time": 57.59072462717692 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:28:44", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1417, | |
| "summarize_time": 49.08898218472799, | |
| "generate_output_len_bytes": 2384, | |
| "generate_time": 21.489527861277264 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:32:39", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 74.43774898846944, | |
| "generate_output_len_bytes": 2480, | |
| "generate_time": 34.72673638661703 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:39:21", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1007, | |
| "summarize_time": 153.41076453526816, | |
| "generate_output_len_bytes": 2357, | |
| "generate_time": 91.14894040425618 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 03:52:00", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 763, | |
| "summarize_time": 199.79869039853415, | |
| "generate_output_len_bytes": 2129, | |
| "generate_time": 98.61504419644673 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 04:08:12", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 991, | |
| "summarize_time": 66.49260465304057, | |
| "generate_output_len_bytes": 2927, | |
| "generate_time": 34.17951035499573 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 04:13:39", | |
| "git_sha": "0cdb75ef", | |
| "n_gpus": 4, | |
| "transformers": "4.30.2", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1000, | |
| "summarize_time": 87.65787092844646, | |
| "generate_output_len_bytes": 3486, | |
| "generate_time": 59.3750696182251 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 22:22:24", | |
| "git_sha": "b63768c6", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "1 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 948, | |
| "summarize_time": 122.13213857014973, | |
| "generate_output_len_bytes": 2826, | |
| "generate_time": 66.34098903338115 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/18/2023 22:33:33", | |
| "git_sha": "c1348fb3", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "2 x NVIDIA RTX 6000 Ada Generation (49140 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 948, | |
| "summarize_time": 120.53812781969707, | |
| "generate_output_len_bytes": 2826, | |
| "generate_time": 67.28052496910095 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 22:56:52", | |
| "git_sha": "fb84de76", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1036, | |
| "summarize_time": 29.128981749216717, | |
| "generate_output_len_bytes": 2242, | |
| "generate_time": 12.197122732798258 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/18/2023 23:00:33", | |
| "git_sha": "fb84de76", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "1 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 05:47:43", | |
| "git_sha": "22352acd", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 05:48:58", | |
| "git_sha": "22352acd", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/19/2023 05:50:40", | |
| "git_sha": "22352acd", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 948, | |
| "summarize_time": 165.05752809842429, | |
| "generate_output_len_bytes": 2605, | |
| "generate_time": 93.80659619967143 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 06:05:51", | |
| "git_sha": "22352acd", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 06:10:05", | |
| "git_sha": "22352acd", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 906, | |
| "summarize_time": 410.0691332022349, | |
| "generate_output_len_bytes": 521, | |
| "generate_time": 57.71272214253744 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 06:36:58", | |
| "git_sha": "22352acd", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 948, | |
| "summarize_time": 171.74388321240744, | |
| "generate_output_len_bytes": 2605, | |
| "generate_time": 97.00725762049358 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 06:51:13", | |
| "git_sha": "22352acd", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 792, | |
| "summarize_time": 267.0555826822917, | |
| "generate_output_len_bytes": 2783, | |
| "generate_time": 163.99818523724875 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 07:13:35", | |
| "git_sha": "22352acd", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 906, | |
| "summarize_time": 413.9569679101308, | |
| "generate_output_len_bytes": 521, | |
| "generate_time": 58.52583885192871 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/19/2023 07:38:02", | |
| "git_sha": "22352acd", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 948, | |
| "summarize_time": 175.4907926718394, | |
| "generate_output_len_bytes": 2605, | |
| "generate_time": 98.97720170021057 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/19/2023 12:35:08", | |
| "git_sha": "29a002e5", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "timemachine", | |
| "gpus": "2 x NVIDIA GeForce RTX 3090 (24576 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 983, | |
| "summarize_time": 42.21107586224874, | |
| "generate_output_len_bytes": 2130, | |
| "generate_time": 16.94527777036031 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/21/2023 20:03:36", | |
| "git_sha": "51318f44", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 41.0461368560791, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 19.614749511082966 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 20:07:35", | |
| "git_sha": "51318f44", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 42.8376894791921, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 20.2719091574351 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/21/2023 20:42:46", | |
| "git_sha": "2f4bb620", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 20:50:19", | |
| "git_sha": "2f4bb620", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 66.52468911806743, | |
| "generate_output_len_bytes": 2479, | |
| "generate_time": 29.828714847564697 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 20:56:04", | |
| "git_sha": "2f4bb620", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "4 x NVIDIA RTX A6000 (46068 MiB)", | |
| "exception": "OOM" | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/21/2023 19:55:35", | |
| "git_sha": "51318f44", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 38.753786404927574, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 19.529522736867268 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/21/2023 20:36:13", | |
| "git_sha": "51318f44", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 41.024452924728394, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 20.29120985666911 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/21/2023 20:40:08", | |
| "git_sha": "51318f44", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 54.554532527923584, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 24.604793945948284 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 20:50:05", | |
| "git_sha": "51318f44", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 41.09950613975525, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 20.947362899780273 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 20:54:08", | |
| "git_sha": "51318f44", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 58.3172922929128, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 25.735217014948528 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/21/2023 21:01:04", | |
| "git_sha": "51318f44", | |
| "n_gpus": 8, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 42.85940829912821, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 21.380353291829426 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/21/2023 21:05:24", | |
| "git_sha": "51318f44", | |
| "n_gpus": 8, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 54.235164642333984, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 25.70338026682536 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/21/2023 21:10:37", | |
| "git_sha": "51318f44", | |
| "n_gpus": 8, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 927, | |
| "summarize_time": 133.53030570348105, | |
| "generate_output_len_bytes": 2782, | |
| "generate_time": 72.97924383481343 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-70b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 22:18:17", | |
| "git_sha": "51318f44", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 927, | |
| "summarize_time": 131.45291074117026, | |
| "generate_output_len_bytes": 2782, | |
| "generate_time": 72.30849742889404 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/21/2023 22:51:09", | |
| "git_sha": "383b6bbc", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 39.269713958104454, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 19.65731406211853 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/21/2023 22:54:54", | |
| "git_sha": "383b6bbc", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "1 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 51.84283971786499, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 28.441521485646565 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/21/2023 23:13:10", | |
| "git_sha": "383b6bbc", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "2 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 53.383726040522255, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 24.422890504201252 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 4, | |
| "reps": 3, | |
| "date": "08/21/2023 23:18:04", | |
| "git_sha": "383b6bbc", | |
| "n_gpus": 4, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "4 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 52.791220347086586, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 25.378511508305866 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 8, | |
| "reps": 3, | |
| "date": "08/21/2023 23:23:11", | |
| "git_sha": "383b6bbc", | |
| "n_gpus": 8, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.8", | |
| "hostname": "cloudvm", | |
| "gpus": "8 x NVIDIA A100-SXM4-80GB (81920 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1046, | |
| "summarize_time": 56.3846542040507, | |
| "generate_output_len_bytes": 2171, | |
| "generate_time": 26.636192480723064 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 1, | |
| "reps": 3, | |
| "date": "08/21/2023 23:52:44", | |
| "git_sha": "da69b822", | |
| "n_gpus": 1, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "1 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1267, | |
| "summarize_time": 40.36223220825195, | |
| "generate_output_len_bytes": 2383, | |
| "generate_time": 19.87660264968872 | |
| }, | |
| { | |
| "backend": "text-generation-inference", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-13b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 2, | |
| "reps": 3, | |
| "date": "08/22/2023 00:15:05", | |
| "git_sha": "e843e8c3", | |
| "n_gpus": 2, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "recypabaszmhhmuae", | |
| "gpus": "2 x NVIDIA RTX A6000 (46068 MiB)", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 915, | |
| "summarize_time": 64.78201874097188, | |
| "generate_output_len_bytes": 2479, | |
| "generate_time": 29.02147897084554 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 16, | |
| "ngpus": 0, | |
| "reps": 3, | |
| "date": "08/22/2023 19:01:15", | |
| "git_sha": "855b7d15", | |
| "n_gpus": 0, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "CPU", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1351, | |
| "summarize_time": 1215.5185990333557, | |
| "generate_output_len_bytes": 849, | |
| "generate_time": 180.56836318969727 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 8, | |
| "ngpus": 0, | |
| "reps": 3, | |
| "date": "08/22/2023 20:11:16", | |
| "git_sha": "855b7d15", | |
| "n_gpus": 0, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "CPU", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1353, | |
| "summarize_time": 1216.9783231417339, | |
| "generate_output_len_bytes": 849, | |
| "generate_time": 180.42225472132364 | |
| }, | |
| { | |
| "backend": "transformers", | |
| "base_model": "h2oai/h2ogpt-4096-llama2-7b-chat", | |
| "task": "summary_and_generate", | |
| "bits": 4, | |
| "ngpus": 0, | |
| "reps": 3, | |
| "date": "08/22/2023 21:21:20", | |
| "git_sha": "855b7d15", | |
| "n_gpus": 0, | |
| "transformers": "4.31.0", | |
| "bitsandbytes": "0.41.1", | |
| "cuda": "11.7", | |
| "hostname": "rippa", | |
| "gpus": "CPU", | |
| "summarize_input_len_bytes": 857252, | |
| "summarize_output_len_bytes": 1354, | |
| "summarize_time": 1217.1687794526417, | |
| "generate_output_len_bytes": 843, | |
| "generate_time": 180.78463260332742 | |
| } | |
| ] | |