#!/bin/bash
#
# Runs run_benchmark.py nine times in a row, from the current directory.
#
# Every run passes its own --trace-file path and captures stdout and stderr
# together in a per-run .txt log. The first run passes every --disable_* flag
# plus `--compile_export_mode disabled`; each later run drops one more option,
# and the final run passes nothing but --trace-file. What each flag actually
# does is defined by run_benchmark.py, which is not part of this script.
#
# `set -e` is deliberately not used: a failing configuration leaves its error
# output in its own log and the remaining configurations still run.

# 1. Baseline: all --disable_* flags set, compile/export mode "disabled".
python run_benchmark.py \
  --trace-file baseline.json.gz \
  --disable_bf16 \
  --compile_export_mode disabled \
  --disable_fused_projections \
  --disable_channels_last \
  --disable_fa3 \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > baseline.txt 2>&1

# 2. Same as (1) without --disable_bf16.
# NOTE(review): the trace is named bfloat16.json.gz while the log is bf16.txt;
# kept as-is in case other tooling expects these exact names.
python run_benchmark.py \
  --trace-file bfloat16.json.gz \
  --compile_export_mode disabled \
  --disable_fused_projections \
  --disable_channels_last \
  --disable_fa3 \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > bf16.txt 2>&1

# 3. Same as (2) but with --compile_export_mode switched to "compile".
python run_benchmark.py \
  --trace-file bf16_compile.json.gz \
  --compile_export_mode compile \
  --disable_fused_projections \
  --disable_channels_last \
  --disable_fa3 \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > bf16_compile.txt 2>&1

# 4. Same as (3) without --disable_fused_projections.
python run_benchmark.py \
  --trace-file bf16_compile_qkv.json.gz \
  --compile_export_mode compile \
  --disable_channels_last \
  --disable_fa3 \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > bf16_compile_qkv.txt 2>&1

# 5. Same as (4) without --disable_channels_last.
python run_benchmark.py \
  --trace-file bf16_compile_qkv_chan.json.gz \
  --compile_export_mode compile \
  --disable_fa3 \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > bf16_compile_qkv_chan.txt 2>&1

# 6. Same as (5) without --disable_fa3.
python run_benchmark.py \
  --trace-file bf16_compile_qkv_chan_fa3.json.gz \
  --compile_export_mode compile \
  --disable_quant \
  --disable_inductor_tuning_flags \
  > bf16_compile_qkv_chan_fa3.txt 2>&1

# 7. Same as (6) without --disable_quant.
python run_benchmark.py \
  --trace-file bf16_compile_qkv_chan_fa3_quant.json.gz \
  --compile_export_mode compile \
  --disable_inductor_tuning_flags \
  > bf16_compile_qkv_chan_fa3_quant.txt 2>&1

# 8. Same as (7) without --disable_inductor_tuning_flags.
python run_benchmark.py \
  --trace-file bf16_compile_qkv_chan_fa3_quant_flags.json.gz \
  --compile_export_mode compile \
  > bf16_compile_qkv_chan_fa3_quant_flags.txt 2>&1

# 9. Only --trace-file is given; every other option, including
# --compile_export_mode, is left to run_benchmark.py's own defaults
# (not visible from this script).
python run_benchmark.py --trace-file fully_optimized.json.gz \
  > fully_optimized.txt 2>&1