From 06dab189cb517cabe81503caa755849d99c23b97 Mon Sep 17 00:00:00 2001 From: Ilyas Moutawwakil <57442720+IlyasMoutawwakil@users.noreply.github.com> Date: Mon, 19 Feb 2024 09:42:13 +0100 Subject: [PATCH] moved complex examples (#127) --- .gitignore | 5 +- README.md | 6 +- examples/api_launch.py | 1 - examples/fast-mteb/README.md | 44 -- .../artifacts/forward_latency_plot.png | Bin 31081 -> 0 bytes .../artifacts/forward_throughput_plot.png | Bin 44934 -> 0 bytes examples/fast-mteb/artifacts/full_report.csv | 52 -- examples/fast-mteb/artifacts/rich_table.svg | 479 --------------- examples/fast-mteb/artifacts/short_report.csv | 52 -- .../fast-mteb/configs/bge_base_config.yaml | 31 - .../bge_batch_size_sweep_baseline.yaml | 12 - .../bge_batch_size_sweep_ort_cuda_o4.yaml | 10 - .../bge_batch_size_sweep_ort_trt_fp16.yaml | 11 - .../configs/bge_seq_len_sweep_baseline.yaml | 12 - .../bge_seq_len_sweep_ort_cuda_o4.yaml | 10 - .../bge_seq_len_sweep_ort_trt_fp16.yaml | 11 - .../0/.hydra/config.yaml | 69 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 69 --- .../0/inference_results.csv | 2 - .../10/.hydra/config.yaml | 69 --- .../10/.hydra/hydra.yaml | 175 ------ .../10/.hydra/overrides.yaml | 2 - .../10/hydra_config.yaml | 69 --- .../10/inference_results.csv | 2 - .../7/.hydra/config.yaml | 69 --- .../7/.hydra/hydra.yaml | 175 ------ .../7/.hydra/overrides.yaml | 2 - .../7/hydra_config.yaml | 69 --- .../7/inference_results.csv | 2 - .../4/.hydra/config.yaml | 69 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 69 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 69 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 69 --- .../1/inference_results.csv | 2 - .../11/.hydra/config.yaml | 69 --- .../11/.hydra/hydra.yaml | 175 ------ .../11/.hydra/overrides.yaml | 2 - .../11/hydra_config.yaml | 69 --- .../11/inference_results.csv | 2 - .../8/.hydra/config.yaml | 69 --- .../8/.hydra/hydra.yaml | 175 ------ .../8/.hydra/overrides.yaml | 2 - .../8/hydra_config.yaml | 69 --- .../8/inference_results.csv | 2 - .../5/.hydra/config.yaml | 69 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 69 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 69 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 69 --- .../2/inference_results.csv | 2 - .../9/.hydra/config.yaml | 69 --- .../9/.hydra/hydra.yaml | 175 ------ .../9/.hydra/overrides.yaml | 2 - .../9/hydra_config.yaml | 69 --- .../9/inference_results.csv | 2 - .../6/.hydra/config.yaml | 69 --- .../6/.hydra/hydra.yaml | 175 ------ .../6/.hydra/overrides.yaml | 2 - .../6/hydra_config.yaml | 69 --- .../6/inference_results.csv | 2 - .../3/.hydra/config.yaml | 69 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 69 --- .../3/inference_results.csv | 2 - .../multirun.yaml | 242 -------- .../0/.hydra/config.yaml | 79 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 80 --- .../0/inference_results.csv | 2 - .../10/.hydra/config.yaml | 79 --- .../10/.hydra/hydra.yaml | 175 ------ .../10/.hydra/overrides.yaml | 2 - .../10/hydra_config.yaml | 80 --- .../10/inference_results.csv | 2 - .../7/.hydra/config.yaml | 79 --- .../7/.hydra/hydra.yaml | 175 ------ .../7/.hydra/overrides.yaml | 2 - .../7/hydra_config.yaml | 80 --- .../7/inference_results.csv | 2 - .../4/.hydra/config.yaml | 79 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 80 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 79 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 80 --- .../1/inference_results.csv | 2 - .../11/.hydra/config.yaml | 79 --- .../11/.hydra/hydra.yaml | 175 ------ .../11/.hydra/overrides.yaml | 2 - .../11/hydra_config.yaml | 80 --- .../11/inference_results.csv | 2 - .../8/.hydra/config.yaml | 79 --- .../8/.hydra/hydra.yaml | 175 ------ .../8/.hydra/overrides.yaml | 2 - .../8/hydra_config.yaml | 80 --- .../8/inference_results.csv | 2 - .../5/.hydra/config.yaml | 79 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 80 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 79 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 80 --- .../2/inference_results.csv | 2 - .../9/.hydra/config.yaml | 79 --- .../9/.hydra/hydra.yaml | 175 ------ .../9/.hydra/overrides.yaml | 2 - .../9/hydra_config.yaml | 80 --- .../9/inference_results.csv | 2 - .../6/.hydra/config.yaml | 79 --- .../6/.hydra/hydra.yaml | 175 ------ .../6/.hydra/overrides.yaml | 2 - .../6/hydra_config.yaml | 80 --- .../6/inference_results.csv | 2 - .../3/.hydra/config.yaml | 79 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 80 --- .../3/inference_results.csv | 2 - .../multirun.yaml | 252 -------- .../0/.hydra/config.yaml | 80 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 82 --- .../0/inference_results.csv | 2 - .../7/.hydra/config.yaml | 80 --- .../7/.hydra/hydra.yaml | 175 ------ .../7/.hydra/overrides.yaml | 2 - .../7/hydra_config.yaml | 82 --- .../7/inference_results.csv | 2 - .../4/.hydra/config.yaml | 80 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 82 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 80 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 82 --- .../1/inference_results.csv | 2 - .../8/.hydra/config.yaml | 80 --- .../8/.hydra/hydra.yaml | 175 ------ .../8/.hydra/overrides.yaml | 2 - .../8/hydra_config.yaml | 82 --- .../8/inference_results.csv | 2 - .../5/.hydra/config.yaml | 80 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 82 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 80 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 82 --- .../2/inference_results.csv | 2 - .../9/.hydra/config.yaml | 80 --- .../9/.hydra/hydra.yaml | 175 ------ .../9/.hydra/overrides.yaml | 2 - .../9/hydra_config.yaml | 82 --- .../6/.hydra/config.yaml | 80 --- .../6/.hydra/hydra.yaml | 175 ------ .../6/.hydra/overrides.yaml | 2 - .../6/hydra_config.yaml | 82 --- .../6/inference_results.csv | 2 - .../3/.hydra/config.yaml | 80 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 82 --- .../3/inference_results.csv | 2 - .../multirun.yaml | 253 -------- .../3/.hydra/config.yaml | 69 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 69 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 69 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 69 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 69 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 69 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 69 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 69 --- .../1/inference_results.csv | 2 - .../5/.hydra/config.yaml | 69 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 69 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 69 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 69 --- .../2/inference_results.csv | 2 - .../multirun.yaml | 242 -------- .../3/.hydra/config.yaml | 79 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 80 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 79 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 80 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 79 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 80 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 79 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 80 --- .../1/inference_results.csv | 2 - .../5/.hydra/config.yaml | 79 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 80 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 79 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 80 --- .../2/inference_results.csv | 2 - .../multirun.yaml | 252 -------- .../3/.hydra/config.yaml | 80 --- .../3/.hydra/hydra.yaml | 175 ------ .../3/.hydra/overrides.yaml | 2 - .../3/hydra_config.yaml | 82 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 80 --- .../0/.hydra/hydra.yaml | 175 ------ .../0/.hydra/overrides.yaml | 2 - .../0/hydra_config.yaml | 82 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 80 --- .../4/.hydra/hydra.yaml | 175 ------ .../4/.hydra/overrides.yaml | 2 - .../4/hydra_config.yaml | 82 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 80 --- .../1/.hydra/hydra.yaml | 175 ------ .../1/.hydra/overrides.yaml | 2 - .../1/hydra_config.yaml | 82 --- .../1/inference_results.csv | 2 - .../5/.hydra/config.yaml | 80 --- .../5/.hydra/hydra.yaml | 175 ------ .../5/.hydra/overrides.yaml | 2 - .../5/hydra_config.yaml | 82 --- .../5/inference_results.csv | 2 - .../2/.hydra/config.yaml | 80 --- .../2/.hydra/hydra.yaml | 175 ------ .../2/.hydra/overrides.yaml | 2 - .../2/hydra_config.yaml | 82 --- .../2/inference_results.csv | 2 - .../multirun.yaml | 253 -------- examples/fast-mteb/report.py | 222 ------- examples/fast-mteb/script.sh | 7 - examples/openvino_diffusion.yaml | 3 +- examples/running-llamas/README.md | 66 --- .../Llama-13b/decode_throughput_bar_plot.png | Bin 41316 -> 0 bytes .../Llama-13b/decode_throughput_line_plot.png | Bin 64674 -> 0 bytes .../artifacts/Llama-13b/full_report.csv | 31 - ...generate_max_memory_allocated_bar_plot.png | Bin 44083 -> 0 bytes ...enerate_max_memory_allocated_line_plot.png | Bin 61570 -> 0 bytes .../generate_max_memory_reserved_bar_plot.png | Bin 46918 -> 0 bytes ...generate_max_memory_reserved_line_plot.png | Bin 61567 -> 0 bytes .../peak_decode_throughput_bar_plot.png | Bin 40338 -> 0 bytes .../Llama-13b/prefill_latency_bar_plot.png | Bin 36349 -> 0 bytes .../Llama-13b/prefill_latency_line_plot.png | Bin 59534 -> 0 bytes .../artifacts/Llama-13b/short_report.csv | 31 - .../Llama-65b/decode_throughput_bar_plot.png | Bin 32942 -> 0 bytes .../Llama-65b/decode_throughput_line_plot.png | Bin 43750 -> 0 bytes .../artifacts/Llama-65b/full_report.csv | 9 - ...generate_max_memory_allocated_bar_plot.png | Bin 39213 -> 0 bytes ...enerate_max_memory_allocated_line_plot.png | Bin 47608 -> 0 bytes .../generate_max_memory_reserved_bar_plot.png | Bin 39831 -> 0 bytes ...generate_max_memory_reserved_line_plot.png | Bin 48540 -> 0 bytes .../peak_decode_throughput_bar_plot.png | Bin 30405 -> 0 bytes .../Llama-65b/prefill_latency_bar_plot.png | Bin 30959 -> 0 bytes .../Llama-65b/prefill_latency_line_plot.png | Bin 41751 -> 0 bytes .../artifacts/Llama-65b/short_report.csv | 9 - .../Llama-7b/decode_throughput_bar_plot.png | Bin 41663 -> 0 bytes .../Llama-7b/decode_throughput_line_plot.png | Bin 70079 -> 0 bytes .../artifacts/Llama-7b/full_report.csv | 36 -- ...generate_max_memory_allocated_bar_plot.png | Bin 44722 -> 0 bytes ...enerate_max_memory_allocated_line_plot.png | Bin 64550 -> 0 bytes .../generate_max_memory_reserved_bar_plot.png | Bin 47072 -> 0 bytes ...generate_max_memory_reserved_line_plot.png | Bin 63481 -> 0 bytes .../peak_decode_throughput_bar_plot.png | Bin 40604 -> 0 bytes .../Llama-7b/prefill_latency_bar_plot.png | Bin 36913 -> 0 bytes .../Llama-7b/prefill_latency_line_plot.png | Bin 58741 -> 0 bytes .../artifacts/Llama-7b/short_report.csv | 36 -- examples/running-llamas/configs/_base_.yaml | 40 -- .../running-llamas/configs/fp16+bt+tp=2.yaml | 22 - examples/running-llamas/configs/fp16+bt.yaml | 9 - .../running-llamas/configs/fp16+dp=2.yaml | 15 - .../running-llamas/configs/fp16+fa2+tp=2.yaml | 22 - examples/running-llamas/configs/fp16+fa2.yaml | 9 - .../configs/fp16+gptq+exllamav1+dp=2.yaml | 27 - .../configs/fp16+gptq+exllamav1.yaml | 20 - .../configs/fp16+gptq+exllamav2+dp=2.yaml | 27 - .../configs/fp16+gptq+exllamav2.yaml | 20 - .../running-llamas/configs/fp16+tp=2.yaml | 21 - examples/running-llamas/configs/fp16.yaml | 6 - examples/running-llamas/report.py | 289 --------- examples/running-mistrals/README.md | 60 -- .../A100-80GB/forward_latency_plot.png | Bin 39767 -> 0 bytes .../A100-80GB/forward_memory_plot.png | Bin 44926 -> 0 bytes .../artifacts/A100-80GB/full_report.csv | 21 - .../A100-80GB/generate_memory_plot.png | Bin 45209 -> 0 bytes .../A100-80GB/generate_throughput_plot.png | Bin 50050 -> 0 bytes .../artifacts/A100-80GB/rich_table.svg | 235 -------- .../artifacts/A100-80GB/short_report.csv | 21 - examples/running-mistrals/configs/_base_.yaml | 36 -- examples/running-mistrals/configs/awq.yaml | 6 - examples/running-mistrals/configs/bnb.yaml | 11 - examples/running-mistrals/configs/gptq.yaml | 6 - .../0/.hydra/config.yaml | 71 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 77 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 71 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 77 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 71 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 77 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 71 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 77 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 71 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 77 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 73 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 80 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 73 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 80 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 73 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 80 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 73 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 80 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 73 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 80 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 70 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 77 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 70 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 77 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 70 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 77 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 70 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 77 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 70 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 77 --- .../3/inference_results.csv | 2 - .../multirun.yaml | 243 -------- .../0/.hydra/config.yaml | 71 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 77 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 71 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 77 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 71 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 77 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 71 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 77 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 71 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 77 --- .../3/inference_results.csv | 2 - examples/running-mistrals/report.py | 229 ------- examples/running-vicunas/README.md | 61 -- .../A100-80GB/forward_latency_plot.png | Bin 52063 -> 0 bytes .../A100-80GB/forward_memory_plot.png | Bin 44235 -> 0 bytes .../artifacts/A100-80GB/full_report.csv | 26 - .../A100-80GB/generate_memory_plot.png | Bin 51647 -> 0 bytes .../A100-80GB/generate_throughput_plot.png | Bin 58622 -> 0 bytes .../artifacts/A100-80GB/rich_table.svg | 275 --------- .../artifacts/A100-80GB/short_report.csv | 26 - examples/running-vicunas/configs/_base_.yaml | 36 -- .../running-vicunas/configs/awq+gemm.yaml | 6 - .../running-vicunas/configs/awq+gemv.yaml | 6 - examples/running-vicunas/configs/bnb.yaml | 11 - examples/running-vicunas/configs/gptq.yaml | 6 - .../0/.hydra/config.yaml | 70 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 76 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 70 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 76 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 70 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 76 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 70 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 76 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 70 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 76 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 70 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 76 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 70 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 76 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 70 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 76 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 70 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 76 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 70 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 76 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 72 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 79 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 72 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 79 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 72 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 79 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 72 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 79 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 72 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 79 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 70 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 76 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 70 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 76 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 70 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 76 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 70 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 76 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 70 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 76 --- .../3/inference_results.csv | 2 - .../0/.hydra/config.yaml | 70 --- .../0/.hydra/hydra.yaml | 174 ------ .../0/.hydra/overrides.yaml | 1 - .../0/hydra_config.yaml | 76 --- .../0/inference_results.csv | 2 - .../4/.hydra/config.yaml | 70 --- .../4/.hydra/hydra.yaml | 174 ------ .../4/.hydra/overrides.yaml | 1 - .../4/hydra_config.yaml | 76 --- .../4/inference_results.csv | 2 - .../1/.hydra/config.yaml | 70 --- .../1/.hydra/hydra.yaml | 174 ------ .../1/.hydra/overrides.yaml | 1 - .../1/hydra_config.yaml | 76 --- .../1/inference_results.csv | 2 - .../2/.hydra/config.yaml | 70 --- .../2/.hydra/hydra.yaml | 174 ------ .../2/.hydra/overrides.yaml | 1 - .../2/hydra_config.yaml | 76 --- .../2/inference_results.csv | 2 - .../3/.hydra/config.yaml | 70 --- .../3/.hydra/hydra.yaml | 174 ------ .../3/.hydra/overrides.yaml | 1 - .../3/hydra_config.yaml | 76 --- .../3/inference_results.csv | 2 - examples/running-vicunas/report.py | 231 -------- examples/training-llamas/README.md | 54 -- .../artifacts/Llama-2-13b-hf/full_report.csv | 393 ------------ .../peak_training_throughput.png | Bin 37616 -> 0 bytes .../artifacts/Llama-2-13b-hf/short_report.csv | 15 - .../training_throughput_bar_plot.png | Bin 32054 -> 0 bytes .../training_throughput_line_plot.png | Bin 47250 -> 0 bytes .../artifacts/Llama-2-7b-hf/full_report.csv | 561 ------------------ .../peak_training_throughput.png | Bin 40152 -> 0 bytes .../artifacts/Llama-2-7b-hf/short_report.csv | 21 - .../training_throughput_bar_plot.png | Bin 37158 -> 0 bytes .../training_throughput_line_plot.png | Bin 61746 -> 0 bytes examples/training-llamas/configs/_base_.yaml | 41 -- .../training-llamas/configs/fp16+dp=2.yaml | 15 - .../training-llamas/configs/fp16+fsdp=2.yaml | 19 - .../configs/fp16+peft+bnb-4bit+dp=2.yaml | 24 - .../configs/fp16+peft+bnb-4bit.yaml | 15 - .../configs/fp16+peft+dp=2+zero3.yaml | 28 - .../configs/fp16+peft+dp=2.yaml | 20 - .../configs/fp16+peft+gptq-4bit+dp=2.yaml | 16 - .../configs/fp16+peft+gptq-4bit.yaml | 16 - .../training-llamas/configs/fp16+peft.yaml | 11 - examples/training-llamas/configs/fp16.yaml | 6 - examples/training-llamas/report.py | 242 -------- examples/whisper/README.md | 72 --- .../whisper/configs/whisper_auto_opt+qnt.yaml | 13 - .../whisper/configs/whisper_auto_opt.yaml | 16 - .../whisper/configs/whisper_auto_qnt.yaml | 12 - .../whisper/configs/whisper_baseline.yaml | 29 - .../5/.hydra/config.yaml | 110 ---- .../5/.hydra/hydra.yaml | 177 ------ .../5/.hydra/overrides.yaml | 4 - .../5/hydra_config.yaml | 109 ---- .../5/inference_results.csv | 2 - .../whisper_auto_opt(O1)/6/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O1)/6/.hydra/hydra.yaml | 177 ------ .../6/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O1)/6/hydra_config.yaml | 109 ---- .../6/inference_results.csv | 2 - .../whisper_auto_opt(O2)/7/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O2)/7/.hydra/hydra.yaml | 177 ------ .../7/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O2)/7/hydra_config.yaml | 109 ---- .../7/inference_results.csv | 2 - .../whisper_auto_opt(O3)/8/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O3)/8/.hydra/hydra.yaml | 177 ------ .../8/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O3)/8/hydra_config.yaml | 109 ---- .../8/inference_results.csv | 2 - .../whisper_auto_opt(O4)/9/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O4)/9/.hydra/hydra.yaml | 177 ------ .../9/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O4)/9/hydra_config.yaml | 109 ---- .../9/inference_results.csv | 2 - .../15/.hydra/config.yaml | 110 ---- .../15/.hydra/hydra.yaml | 177 ------ .../15/.hydra/overrides.yaml | 4 - .../15/hydra_config.yaml | 109 ---- .../15/inference_results.csv | 2 - .../16/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O1)/16/.hydra/hydra.yaml | 177 ------ .../16/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O1)/16/hydra_config.yaml | 109 ---- .../16/inference_results.csv | 2 - .../17/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O2)/17/.hydra/hydra.yaml | 177 ------ .../17/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O2)/17/hydra_config.yaml | 109 ---- .../17/inference_results.csv | 2 - .../18/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O3)/18/.hydra/hydra.yaml | 177 ------ .../18/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O3)/18/hydra_config.yaml | 109 ---- .../18/inference_results.csv | 2 - .../19/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O4)/19/.hydra/hydra.yaml | 177 ------ .../19/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O4)/19/hydra_config.yaml | 109 ---- .../19/inference_results.csv | 2 - .../0/.hydra/config.yaml | 110 ---- .../0/.hydra/hydra.yaml | 177 ------ .../0/.hydra/overrides.yaml | 4 - .../0/hydra_config.yaml | 109 ---- .../0/inference_results.csv | 2 - .../whisper_auto_opt(O1)/1/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O1)/1/.hydra/hydra.yaml | 177 ------ .../1/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O1)/1/hydra_config.yaml | 109 ---- .../1/inference_results.csv | 2 - .../whisper_auto_opt(O2)/2/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O2)/2/.hydra/hydra.yaml | 177 ------ .../2/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O2)/2/hydra_config.yaml | 109 ---- .../2/inference_results.csv | 2 - .../whisper_auto_opt(O3)/3/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O3)/3/.hydra/hydra.yaml | 177 ------ .../3/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O3)/3/hydra_config.yaml | 109 ---- .../3/inference_results.csv | 2 - .../whisper_auto_opt(O4)/4/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O4)/4/.hydra/hydra.yaml | 177 ------ .../4/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O4)/4/hydra_config.yaml | 109 ---- .../4/inference_results.csv | 2 - .../10/.hydra/config.yaml | 110 ---- .../10/.hydra/hydra.yaml | 177 ------ .../10/.hydra/overrides.yaml | 4 - .../10/hydra_config.yaml | 109 ---- .../10/inference_results.csv | 2 - .../11/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O1)/11/.hydra/hydra.yaml | 177 ------ .../11/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O1)/11/hydra_config.yaml | 109 ---- .../11/inference_results.csv | 2 - .../12/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O2)/12/.hydra/hydra.yaml | 177 ------ .../12/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O2)/12/hydra_config.yaml | 109 ---- .../12/inference_results.csv | 2 - .../13/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O3)/13/.hydra/hydra.yaml | 177 ------ .../13/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O3)/13/hydra_config.yaml | 109 ---- .../13/inference_results.csv | 2 - .../14/.hydra/config.yaml | 110 ---- .../whisper_auto_opt(O4)/14/.hydra/hydra.yaml | 177 ------ .../14/.hydra/overrides.yaml | 4 - .../whisper_auto_opt(O4)/14/hydra_config.yaml | 109 ---- .../14/inference_results.csv | 2 - .../whisper_baseline/1/.hydra/config.yaml | 66 --- .../whisper_baseline/1/.hydra/hydra.yaml | 175 ------ .../whisper_baseline/1/.hydra/overrides.yaml | 3 - .../whisper_baseline/1/hydra_config.yaml | 66 --- .../whisper_baseline/1/inference_results.csv | 2 - .../whisper_baseline/3/.hydra/config.yaml | 66 --- .../whisper_baseline/3/.hydra/hydra.yaml | 175 ------ .../whisper_baseline/3/.hydra/overrides.yaml | 3 - .../whisper_baseline/3/hydra_config.yaml | 66 --- .../whisper_baseline/3/inference_results.csv | 2 - .../whisper_baseline/0/.hydra/config.yaml | 66 --- .../whisper_baseline/0/.hydra/hydra.yaml | 175 ------ .../whisper_baseline/0/.hydra/overrides.yaml | 3 - .../whisper_baseline/0/hydra_config.yaml | 66 --- .../whisper_baseline/0/inference_results.csv | 2 - .../whisper_baseline/2/.hydra/config.yaml | 66 --- .../whisper_baseline/2/.hydra/hydra.yaml | 175 ------ .../whisper_baseline/2/.hydra/overrides.yaml | 3 - .../whisper_baseline/2/hydra_config.yaml | 66 --- .../whisper_baseline/2/inference_results.csv | 2 - .../cuda_128_10/forward_throughput.png | Bin 57908 -> 0 bytes .../cuda_128_10/generate_throughput.png | Bin 61251 -> 0 bytes .../reports/cuda_128_10/inference_report.csv | 7 - .../reports/cuda_128_10/rich_table.svg | 129 ---- .../cuda_128_100/forward_throughput.png | Bin 58341 -> 0 bytes .../cuda_128_100/generate_throughput.png | Bin 60528 -> 0 bytes .../reports/cuda_128_100/inference_report.csv | 7 - .../reports/cuda_128_100/rich_table.svg | 129 ---- .../reports/cuda_64_10/forward_throughput.png | Bin 57810 -> 0 bytes .../cuda_64_10/generate_throughput.png | Bin 60243 -> 0 bytes .../reports/cuda_64_10/inference_report.csv | 7 - .../whisper/reports/cuda_64_10/rich_table.svg | 129 ---- .../cuda_64_100/forward_throughput.png | Bin 58139 -> 0 bytes .../cuda_64_100/generate_throughput.png | Bin 59021 -> 0 bytes .../reports/cuda_64_100/inference_report.csv | 7 - .../reports/cuda_64_100/rich_table.svg | 129 ---- examples/whisper/scripts/benchmark.sh | 10 - examples/whisper/scripts/report.sh | 11 - 750 files changed, 6 insertions(+), 48109 deletions(-) delete mode 100644 examples/fast-mteb/README.md delete mode 100644 examples/fast-mteb/artifacts/forward_latency_plot.png delete mode 100644 examples/fast-mteb/artifacts/forward_throughput_plot.png delete mode 100644 examples/fast-mteb/artifacts/full_report.csv delete mode 100644 examples/fast-mteb/artifacts/rich_table.svg delete mode 100644 examples/fast-mteb/artifacts/short_report.csv delete mode 100644 examples/fast-mteb/configs/bge_base_config.yaml delete mode 100644 examples/fast-mteb/configs/bge_batch_size_sweep_baseline.yaml delete mode 100644 examples/fast-mteb/configs/bge_batch_size_sweep_ort_cuda_o4.yaml delete mode 100644 examples/fast-mteb/configs/bge_batch_size_sweep_ort_trt_fp16.yaml delete mode 100644 examples/fast-mteb/configs/bge_seq_len_sweep_baseline.yaml delete mode 100644 examples/fast-mteb/configs/bge_seq_len_sweep_ort_cuda_o4.yaml delete mode 100644 examples/fast-mteb/configs/bge_seq_len_sweep_ort_trt_fp16.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1)_sequence_length(256)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1)_sequence_length(256)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1)_sequence_length(256)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1)_sequence_length(256)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1)_sequence_length(256)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1024)_sequence_length(256)/10/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1024)_sequence_length(256)/10/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1024)_sequence_length(256)/10/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1024)_sequence_length(256)/10/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(1024)_sequence_length(256)/10/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(128)_sequence_length(256)/7/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(128)_sequence_length(256)/7/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(128)_sequence_length(256)/7/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(128)_sequence_length(256)/7/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(128)_sequence_length(256)/7/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(16)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(16)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(16)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(16)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(16)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2)_sequence_length(256)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2)_sequence_length(256)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2)_sequence_length(256)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2)_sequence_length(256)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2)_sequence_length(256)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2048)_sequence_length(256)/11/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2048)_sequence_length(256)/11/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2048)_sequence_length(256)/11/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2048)_sequence_length(256)/11/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(2048)_sequence_length(256)/11/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(256)_sequence_length(256)/8/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(256)_sequence_length(256)/8/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(256)_sequence_length(256)/8/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(256)_sequence_length(256)/8/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(256)_sequence_length(256)/8/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(32)_sequence_length(256)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(32)_sequence_length(256)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(32)_sequence_length(256)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(32)_sequence_length(256)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(32)_sequence_length(256)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(4)_sequence_length(256)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(4)_sequence_length(256)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(4)_sequence_length(256)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(4)_sequence_length(256)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(4)_sequence_length(256)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(512)_sequence_length(256)/9/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(512)_sequence_length(256)/9/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(512)_sequence_length(256)/9/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(512)_sequence_length(256)/9/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(512)_sequence_length(256)/9/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(64)_sequence_length(256)/6/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(64)_sequence_length(256)/6/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(64)_sequence_length(256)/6/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(64)_sequence_length(256)/6/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(64)_sequence_length(256)/6/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(8)_sequence_length(256)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(8)_sequence_length(256)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(8)_sequence_length(256)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(8)_sequence_length(256)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(8)_sequence_length(256)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_baseline_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1024)_sequence_length(256)/10/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1024)_sequence_length(256)/10/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1024)_sequence_length(256)/10/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1024)_sequence_length(256)/10/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(1024)_sequence_length(256)/10/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(128)_sequence_length(256)/7/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(128)_sequence_length(256)/7/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(128)_sequence_length(256)/7/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(128)_sequence_length(256)/7/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(128)_sequence_length(256)/7/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(16)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(16)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(16)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(16)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(16)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2)_sequence_length(256)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2)_sequence_length(256)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2)_sequence_length(256)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2)_sequence_length(256)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2)_sequence_length(256)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2048)_sequence_length(256)/11/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2048)_sequence_length(256)/11/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2048)_sequence_length(256)/11/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2048)_sequence_length(256)/11/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(2048)_sequence_length(256)/11/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(256)_sequence_length(256)/8/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(256)_sequence_length(256)/8/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(256)_sequence_length(256)/8/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(256)_sequence_length(256)/8/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(256)_sequence_length(256)/8/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(32)_sequence_length(256)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(32)_sequence_length(256)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(32)_sequence_length(256)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(32)_sequence_length(256)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(32)_sequence_length(256)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(4)_sequence_length(256)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(4)_sequence_length(256)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(4)_sequence_length(256)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(4)_sequence_length(256)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(4)_sequence_length(256)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(512)_sequence_length(256)/9/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(512)_sequence_length(256)/9/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(512)_sequence_length(256)/9/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(512)_sequence_length(256)/9/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(512)_sequence_length(256)/9/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(64)_sequence_length(256)/6/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(64)_sequence_length(256)/6/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(64)_sequence_length(256)/6/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(64)_sequence_length(256)/6/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(64)_sequence_length(256)/6/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(8)_sequence_length(256)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(8)_sequence_length(256)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(8)_sequence_length(256)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(8)_sequence_length(256)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(8)_sequence_length(256)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_cuda_o4_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(128)_sequence_length(256)/7/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(128)_sequence_length(256)/7/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(128)_sequence_length(256)/7/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(128)_sequence_length(256)/7/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(128)_sequence_length(256)/7/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(16)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(16)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(16)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(16)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(16)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(2)_sequence_length(256)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(2)_sequence_length(256)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(2)_sequence_length(256)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(2)_sequence_length(256)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(2)_sequence_length(256)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(256)_sequence_length(256)/8/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(256)_sequence_length(256)/8/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(256)_sequence_length(256)/8/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(256)_sequence_length(256)/8/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(256)_sequence_length(256)/8/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(32)_sequence_length(256)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(32)_sequence_length(256)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(32)_sequence_length(256)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(32)_sequence_length(256)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(32)_sequence_length(256)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(4)_sequence_length(256)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(4)_sequence_length(256)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(4)_sequence_length(256)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(4)_sequence_length(256)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(4)_sequence_length(256)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(512)_sequence_length(256)/9/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(512)_sequence_length(256)/9/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(512)_sequence_length(256)/9/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(512)_sequence_length(256)/9/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(64)_sequence_length(256)/6/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(64)_sequence_length(256)/6/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(64)_sequence_length(256)/6/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(64)_sequence_length(256)/6/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(64)_sequence_length(256)/6/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(8)_sequence_length(256)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(8)_sequence_length(256)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(8)_sequence_length(256)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(8)_sequence_length(256)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(8)_sequence_length(256)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_batch_size_sweep_ort_trt_fp16_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(128)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(128)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(128)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(128)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(128)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(16)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(16)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(16)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(16)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(16)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(32)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(32)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(32)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(32)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(32)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(512)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(512)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(512)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(512)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(512)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(64)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(64)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(64)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(64)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(1)_sequence_length(64)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_baseline_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(128)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(128)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(128)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(128)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(128)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(16)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(16)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(16)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(16)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(16)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(32)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(32)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(32)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(32)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(32)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(512)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(512)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(512)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(512)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(512)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(64)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(64)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(64)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(64)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(1)_sequence_length(64)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_cuda_o4_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(128)/3/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(128)/3/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(128)/3/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(128)/3/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(128)/3/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(16)/0/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(16)/0/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(16)/0/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(16)/0/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(16)/0/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/4/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/4/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/4/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/4/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(256)/4/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(32)/1/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(32)/1/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(32)/1/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(32)/1/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(32)/1/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(512)/5/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(512)/5/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(512)/5/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(512)/5/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(512)/5/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(64)/2/.hydra/config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(64)/2/.hydra/hydra.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(64)/2/.hydra/overrides.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(64)/2/hydra_config.yaml delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(1)_sequence_length(64)/2/inference_results.csv delete mode 100644 examples/fast-mteb/experiments/bge_seq_len_sweep_ort_trt_fp16_batch_size(None)_sequence_length(None)/multirun.yaml delete mode 100644 examples/fast-mteb/report.py delete mode 100644 examples/fast-mteb/script.sh delete mode 100644 examples/running-llamas/README.md delete mode 100644 examples/running-llamas/artifacts/Llama-13b/decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/decode_throughput_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/full_report.csv delete mode 100644 examples/running-llamas/artifacts/Llama-13b/generate_max_memory_allocated_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/generate_max_memory_allocated_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/generate_max_memory_reserved_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/generate_max_memory_reserved_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/peak_decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/prefill_latency_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/prefill_latency_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-13b/short_report.csv delete mode 100644 examples/running-llamas/artifacts/Llama-65b/decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/decode_throughput_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/full_report.csv delete mode 100644 examples/running-llamas/artifacts/Llama-65b/generate_max_memory_allocated_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/generate_max_memory_allocated_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/generate_max_memory_reserved_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/generate_max_memory_reserved_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/peak_decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/prefill_latency_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/prefill_latency_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-65b/short_report.csv delete mode 100644 examples/running-llamas/artifacts/Llama-7b/decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/decode_throughput_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/full_report.csv delete mode 100644 examples/running-llamas/artifacts/Llama-7b/generate_max_memory_allocated_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/generate_max_memory_allocated_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/generate_max_memory_reserved_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/generate_max_memory_reserved_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/peak_decode_throughput_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/prefill_latency_bar_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/prefill_latency_line_plot.png delete mode 100644 examples/running-llamas/artifacts/Llama-7b/short_report.csv delete mode 100644 examples/running-llamas/configs/_base_.yaml delete mode 100644 examples/running-llamas/configs/fp16+bt+tp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16+bt.yaml delete mode 100644 examples/running-llamas/configs/fp16+dp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16+fa2+tp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16+fa2.yaml delete mode 100644 examples/running-llamas/configs/fp16+gptq+exllamav1+dp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16+gptq+exllamav1.yaml delete mode 100644 examples/running-llamas/configs/fp16+gptq+exllamav2+dp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16+gptq+exllamav2.yaml delete mode 100644 examples/running-llamas/configs/fp16+tp=2.yaml delete mode 100644 examples/running-llamas/configs/fp16.yaml delete mode 100644 examples/running-llamas/report.py delete mode 100644 examples/running-mistrals/README.md delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/forward_latency_plot.png delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/forward_memory_plot.png delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/full_report.csv delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/generate_memory_plot.png delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/generate_throughput_plot.png delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/rich_table.svg delete mode 100644 examples/running-mistrals/artifacts/A100-80GB/short_report.csv delete mode 100644 examples/running-mistrals/configs/_base_.yaml delete mode 100644 examples/running-mistrals/configs/awq.yaml delete mode 100644 examples/running-mistrals/configs/bnb.yaml delete mode 100644 examples/running-mistrals/configs/gptq.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/awq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/fp16-batch_size(None)-sequence_length(512)-new_tokens(1000)/multirun.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(512)-new_tokens(1000)/0/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(512)-new_tokens(1000)/4/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(512)-new_tokens(1000)/1/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(512)-new_tokens(1000)/2/inference_results.csv delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/hydra.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/.hydra/overrides.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/hydra_config.yaml delete mode 100644 examples/running-mistrals/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(512)-new_tokens(1000)/3/inference_results.csv delete mode 100644 examples/running-mistrals/report.py delete mode 100644 examples/running-vicunas/README.md delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/forward_latency_plot.png delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/forward_memory_plot.png delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/full_report.csv delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/generate_memory_plot.png delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/generate_throughput_plot.png delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/rich_table.svg delete mode 100644 examples/running-vicunas/artifacts/A100-80GB/short_report.csv delete mode 100644 examples/running-vicunas/configs/_base_.yaml delete mode 100644 examples/running-vicunas/configs/awq+gemm.yaml delete mode 100644 examples/running-vicunas/configs/awq+gemv.yaml delete mode 100644 examples/running-vicunas/configs/bnb.yaml delete mode 100644 examples/running-vicunas/configs/gptq.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(1)-sequence_length(128)-new_tokens(256)/0/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(1)-sequence_length(128)-new_tokens(256)/0/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(16)-sequence_length(128)-new_tokens(256)/4/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(16)-sequence_length(128)-new_tokens(256)/4/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(2)-sequence_length(128)-new_tokens(256)/1/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(2)-sequence_length(128)-new_tokens(256)/1/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(4)-sequence_length(128)-new_tokens(256)/2/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(4)-sequence_length(128)-new_tokens(256)/2/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(8)-sequence_length(128)-new_tokens(256)/3/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemm-batch_size(8)-sequence_length(128)-new_tokens(256)/3/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(1)-sequence_length(128)-new_tokens(256)/0/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(1)-sequence_length(128)-new_tokens(256)/0/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(16)-sequence_length(128)-new_tokens(256)/4/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(16)-sequence_length(128)-new_tokens(256)/4/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(2)-sequence_length(128)-new_tokens(256)/1/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(2)-sequence_length(128)-new_tokens(256)/1/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(4)-sequence_length(128)-new_tokens(256)/2/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(4)-sequence_length(128)-new_tokens(256)/2/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(8)-sequence_length(128)-new_tokens(256)/3/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/awq+gemv-batch_size(8)-sequence_length(128)-new_tokens(256)/3/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(128)-new_tokens(256)/0/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(1)-sequence_length(128)-new_tokens(256)/0/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(128)-new_tokens(256)/4/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(16)-sequence_length(128)-new_tokens(256)/4/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(128)-new_tokens(256)/1/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(2)-sequence_length(128)-new_tokens(256)/1/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(128)-new_tokens(256)/2/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(4)-sequence_length(128)-new_tokens(256)/2/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(128)-new_tokens(256)/3/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/bnb-batch_size(8)-sequence_length(128)-new_tokens(256)/3/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(128)-new_tokens(256)/0/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(1)-sequence_length(128)-new_tokens(256)/0/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(128)-new_tokens(256)/4/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(16)-sequence_length(128)-new_tokens(256)/4/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(128)-new_tokens(256)/1/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(2)-sequence_length(128)-new_tokens(256)/1/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(128)-new_tokens(256)/2/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(4)-sequence_length(128)-new_tokens(256)/2/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(128)-new_tokens(256)/3/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/fp16-batch_size(8)-sequence_length(128)-new_tokens(256)/3/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(128)-new_tokens(256)/0/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(128)-new_tokens(256)/0/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(1)-sequence_length(128)-new_tokens(256)/0/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(128)-new_tokens(256)/4/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(128)-new_tokens(256)/4/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(16)-sequence_length(128)-new_tokens(256)/4/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(128)-new_tokens(256)/1/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(128)-new_tokens(256)/1/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(2)-sequence_length(128)-new_tokens(256)/1/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(128)-new_tokens(256)/2/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(128)-new_tokens(256)/2/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(4)-sequence_length(128)-new_tokens(256)/2/inference_results.csv delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/hydra.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(128)-new_tokens(256)/3/.hydra/overrides.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(128)-new_tokens(256)/3/hydra_config.yaml delete mode 100644 examples/running-vicunas/experiments/A100-80GB/gptq-batch_size(8)-sequence_length(128)-new_tokens(256)/3/inference_results.csv delete mode 100644 examples/running-vicunas/report.py delete mode 100644 examples/training-llamas/README.md delete mode 100644 examples/training-llamas/artifacts/Llama-2-13b-hf/full_report.csv delete mode 100644 examples/training-llamas/artifacts/Llama-2-13b-hf/peak_training_throughput.png delete mode 100644 examples/training-llamas/artifacts/Llama-2-13b-hf/short_report.csv delete mode 100644 examples/training-llamas/artifacts/Llama-2-13b-hf/training_throughput_bar_plot.png delete mode 100644 examples/training-llamas/artifacts/Llama-2-13b-hf/training_throughput_line_plot.png delete mode 100644 examples/training-llamas/artifacts/Llama-2-7b-hf/full_report.csv delete mode 100644 examples/training-llamas/artifacts/Llama-2-7b-hf/peak_training_throughput.png delete mode 100644 examples/training-llamas/artifacts/Llama-2-7b-hf/short_report.csv delete mode 100644 examples/training-llamas/artifacts/Llama-2-7b-hf/training_throughput_bar_plot.png delete mode 100644 examples/training-llamas/artifacts/Llama-2-7b-hf/training_throughput_line_plot.png delete mode 100644 examples/training-llamas/configs/_base_.yaml delete mode 100644 examples/training-llamas/configs/fp16+dp=2.yaml delete mode 100644 examples/training-llamas/configs/fp16+fsdp=2.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+bnb-4bit+dp=2.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+bnb-4bit.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+dp=2+zero3.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+dp=2.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+gptq-4bit+dp=2.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft+gptq-4bit.yaml delete mode 100644 examples/training-llamas/configs/fp16+peft.yaml delete mode 100644 examples/training-llamas/configs/fp16.yaml delete mode 100644 examples/training-llamas/report.py delete mode 100644 examples/whisper/README.md delete mode 100644 examples/whisper/configs/whisper_auto_opt+qnt.yaml delete mode 100644 examples/whisper/configs/whisper_auto_opt.yaml delete mode 100644 examples/whisper/configs/whisper_auto_qnt.yaml delete mode 100644 examples/whisper/configs/whisper_baseline.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(None)/5/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(None)/5/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(None)/5/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(None)/5/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(None)/5/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O1)/6/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O1)/6/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O1)/6/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O1)/6/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O1)/6/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O2)/7/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O2)/7/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O2)/7/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O2)/7/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O2)/7/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O3)/8/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O3)/8/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O3)/8/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O3)/8/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O3)/8/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O4)/9/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O4)/9/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O4)/9/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O4)/9/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_10/whisper_auto_opt(O4)/9/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(None)/15/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(None)/15/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(None)/15/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(None)/15/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(None)/15/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O1)/16/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O1)/16/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O1)/16/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O1)/16/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O1)/16/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O2)/17/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O2)/17/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O2)/17/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O2)/17/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O2)/17/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O3)/18/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O3)/18/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O3)/18/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O3)/18/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O3)/18/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O4)/19/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O4)/19/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O4)/19/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O4)/19/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_128_100/whisper_auto_opt(O4)/19/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(None)/0/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(None)/0/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(None)/0/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(None)/0/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(None)/0/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O1)/1/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O1)/1/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O1)/1/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O1)/1/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O1)/1/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O2)/2/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O2)/2/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O2)/2/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O2)/2/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O2)/2/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O3)/3/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O3)/3/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O3)/3/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O3)/3/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O3)/3/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O4)/4/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O4)/4/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O4)/4/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O4)/4/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_10/whisper_auto_opt(O4)/4/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(None)/10/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(None)/10/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(None)/10/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(None)/10/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(None)/10/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O1)/11/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O1)/11/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O1)/11/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O1)/11/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O1)/11/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O2)/12/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O2)/12/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O2)/12/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O2)/12/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O2)/12/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O3)/13/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O3)/13/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O3)/13/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O3)/13/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O3)/13/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O4)/14/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O4)/14/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O4)/14/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O4)/14/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_onnxruntime_64_100/whisper_auto_opt(O4)/14/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_10/whisper_baseline/1/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_10/whisper_baseline/1/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_10/whisper_baseline/1/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_10/whisper_baseline/1/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_10/whisper_baseline/1/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_100/whisper_baseline/3/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_100/whisper_baseline/3/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_100/whisper_baseline/3/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_100/whisper_baseline/3/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_128_100/whisper_baseline/3/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_10/whisper_baseline/0/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_10/whisper_baseline/0/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_10/whisper_baseline/0/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_10/whisper_baseline/0/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_10/whisper_baseline/0/inference_results.csv delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_100/whisper_baseline/2/.hydra/config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_100/whisper_baseline/2/.hydra/hydra.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_100/whisper_baseline/2/.hydra/overrides.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_100/whisper_baseline/2/hydra_config.yaml delete mode 100644 examples/whisper/experiments/cuda_pytorch_64_100/whisper_baseline/2/inference_results.csv delete mode 100644 examples/whisper/reports/cuda_128_10/forward_throughput.png delete mode 100644 examples/whisper/reports/cuda_128_10/generate_throughput.png delete mode 100644 examples/whisper/reports/cuda_128_10/inference_report.csv delete mode 100644 examples/whisper/reports/cuda_128_10/rich_table.svg delete mode 100644 examples/whisper/reports/cuda_128_100/forward_throughput.png delete mode 100644 examples/whisper/reports/cuda_128_100/generate_throughput.png delete mode 100644 examples/whisper/reports/cuda_128_100/inference_report.csv delete mode 100644 examples/whisper/reports/cuda_128_100/rich_table.svg delete mode 100644 examples/whisper/reports/cuda_64_10/forward_throughput.png delete mode 100644 examples/whisper/reports/cuda_64_10/generate_throughput.png delete mode 100644 examples/whisper/reports/cuda_64_10/inference_report.csv delete mode 100644 examples/whisper/reports/cuda_64_10/rich_table.svg delete mode 100644 examples/whisper/reports/cuda_64_100/forward_throughput.png delete mode 100644 examples/whisper/reports/cuda_64_100/generate_throughput.png delete mode 100644 examples/whisper/reports/cuda_64_100/inference_report.csv delete mode 100644 examples/whisper/reports/cuda_64_100/rich_table.svg delete mode 100644 examples/whisper/scripts/benchmark.sh delete mode 100644 examples/whisper/scripts/report.sh diff --git a/.gitignore b/.gitignore index a8e86c83..ff31100b 100644 --- a/.gitignore +++ b/.gitignore @@ -167,8 +167,7 @@ sweeps/ data/ version.txt +.engine/ actions-runner/ experiments/ -examples/ -.engine/ -amdsmi \ No newline at end of file +amdsmi/ diff --git a/README.md b/README.md index 49889327..8b5e7368 100644 --- a/README.md +++ b/README.md @@ -1,8 +1,8 @@
-All benchmarks are wrong, some will cost you less than the others.
All benchmarks are wrong, some will cost you less than others.
- -
- -### Throughput - -For throughput, we consider the case of a server processing requests of average length (i.e. sequence length of 256). -We achieve a throughput of +2000 samples per second for the forward pass of the embedding model at an optimal batch size of 128 using either `CUDAExecutionProvider` with `O4` optimization level or `TensorrtExecutionProvider` with `fp16` precision. This can be seen as a 7.5x increase over the baseline pytorch model. - -- -
- -### Notes - -- The `TensorrtExecutionProvider` requires engine building, which can take a few minutes during model loading and the first forward pass. It also rebuilds the engine every time the sequence length changes. This is why I think that `CUDAExecutionProvider` with `O4` optimization level is the sweetspot for GPU inference. -- Some other cases, such as processing big batches of short sequences, can demonstrate even higher speedups (~15x). We don't study them here. diff --git a/examples/fast-mteb/artifacts/forward_latency_plot.png b/examples/fast-mteb/artifacts/forward_latency_plot.png deleted file mode 100644 index c4aecc6dbbe596441079c48856f52f2201347ab5..0000000000000000000000000000000000000000 GIT binary patch literal 0 HcmV?d00001 literal 31081 zcmd?Rc{rDC+ckVrN+?t)k*O3altMCukdUb;^N`Yj49QF(q)TMSj~H%_Sjq0Ie*z &e!wAM$aN
z;ktb?cvR}Nau%bT#FF-oyPWZRWU`f-6#GZ4Q;&TzaU44EG7>JqX55}|nmLh@l5+nr
z&PRk=!mag8`Y5hb#w)PU8_VtiyP*X`gdkT;BK9P> *Y&%{bAx1{@CQy@(
z%phdF{G}Fa1Uz&2rbx(2Kws$Fhg^3fPDfT4Qo8Xt;qdWuBje-zJ%k;SpFhF1@IPk0
zj~Y=pI>Z`ESQ%`eHs*9cMDI*3_t|@a
KAp9jKLaHs-Rgw9
zQq%hpdnu$Uh_>WGqBS?iKGx~0v8?Vr4BbDk+l9n1DZ2Xz$3-1vkhW^;+>xM=fx)>!
zw|A5Iq8g|9TE~YpXl6rSw>kAVuHEkZylJm0pLuxI^o}l%oTss@=Vx=xGn%x*Srmg{
zO(O3OLE{v0Tti(wyiQu4=#pEmYh0*O`jZm?o
zNx3r7snJe{clI`g{>4+#K+NiQ7D&~{@t5vI6
z+&yd9ZTW9K(^41&+E13RoXZbJRAi-SWeIi~gPRaZ21@YIK57w=M9v4cd^dI|@pd6+
zA~+-@L`xwZu3SV7$Zn}|tT)os)GR(|huygbACv^UK)6anEn6#xh@94p1QtvE+}R0Z
zuC3XYNC@cIBFu-YQY1)(sk)=1@YqIoXBQU&R3rN7C1F=!=jty|^wP}R@8IBIVsd2K
ztodxr$#3D?DLI&YiJOXo?Rxv