Upload folder using huggingface_hub
Browse files- -_0_0_0/after_recompile_pre_grad_3.txt +13 -0
- -_0_0_0/aot_forward_graph_fw_metadata_4.txt +57 -0
- -_0_0_0/aot_inference_graph_5.txt +6 -0
- -_0_0_0/aotautograd_cache_bypass_9.json +8 -0
- -_0_0_0/before_recompile_pre_grad_2.txt +13 -0
- -_0_0_0/compilation_metrics_11.html +152 -0
- -_0_0_0/dynamo_cpp_guards_str_10.txt +47 -0
- -_0_0_0/dynamo_output_graph_0.txt +13 -0
- -_0_0_0/fx_graph_cache_hit_8.json +315 -0
- -_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html +67 -0
- -_0_0_0/inductor_pre_grad_graph_1.txt +15 -0
- -_0_0_0/torch._functorch.config_6.txt +36 -0
- chromium_events.json +962 -0
- compile_directory.json +78 -0
- failures_and_restarts.html +72 -0
- index.html +202 -0
- raw.log +0 -0
-_0_0_0/after_recompile_pre_grad_3.txt
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
class GraphModule(torch.nn.Module):
|
| 2 |
+
def forward(self, L_w_: "f32[4096, 8192][8192, 1]cuda:0", L_scale_: "f32[4096][1]cuda:0", L_zero_point_: "i32[4096][1]cuda:0"):
|
| 3 |
+
l_w_ = L_w_
|
| 4 |
+
l_scale_ = L_scale_
|
| 5 |
+
l_zero_point_ = L_zero_point_
|
| 6 |
+
|
| 7 |
+
# File: /shared_volume/repos/quark/bench_qdq.py:8 in run_scaled_fake_quantize, code: return scaled_fake_quantize(quant_dtype, w, scale, zero_point, axis, group_size, quant_min, quant_max, round_mode, qscheme, mx_element_dtype)
|
| 8 |
+
function_ctx = torch.autograd.function.FunctionCtx(); function_ctx = None
|
| 9 |
+
|
| 10 |
+
# File: /shared_volume/repos/quark/quark/torch/kernel/__init__.py:168 in forward, code: return ops.quark.scaled_fake_quantize(quant_dtype, inputs, scale, zero_point, axis, group_size, quant_min,
|
| 11 |
+
scaled_fake_quantize: "f32[4096, 8192][8192, 1]cuda:0" = torch.ops.quark.scaled_fake_quantize('int4', l_w_, l_scale_, l_zero_point_, 0, 0, 0, 15, 0, 'per_channel', 'haha'); l_w_ = l_scale_ = l_zero_point_ = None
|
| 12 |
+
return (scaled_fake_quantize,)
|
| 13 |
+
|
-_0_0_0/aot_forward_graph_fw_metadata_4.txt
ADDED
|
@@ -0,0 +1,57 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
ViewAndMutationMeta(input_info=[InputAliasInfo(is_leaf=True,
|
| 2 |
+
mutates_data=False,
|
| 3 |
+
mutates_metadata=False,
|
| 4 |
+
mutations_hidden_from_autograd=True,
|
| 5 |
+
mutations_under_no_grad_or_inference_mode=False,
|
| 6 |
+
mutation_inductor_storage_resize=False,
|
| 7 |
+
mutates_storage_metadata=False,
|
| 8 |
+
requires_grad=False,
|
| 9 |
+
keep_input_mutations=True),
|
| 10 |
+
InputAliasInfo(is_leaf=True,
|
| 11 |
+
mutates_data=False,
|
| 12 |
+
mutates_metadata=False,
|
| 13 |
+
mutations_hidden_from_autograd=True,
|
| 14 |
+
mutations_under_no_grad_or_inference_mode=False,
|
| 15 |
+
mutation_inductor_storage_resize=False,
|
| 16 |
+
mutates_storage_metadata=False,
|
| 17 |
+
requires_grad=False,
|
| 18 |
+
keep_input_mutations=True),
|
| 19 |
+
InputAliasInfo(is_leaf=True,
|
| 20 |
+
mutates_data=False,
|
| 21 |
+
mutates_metadata=False,
|
| 22 |
+
mutations_hidden_from_autograd=True,
|
| 23 |
+
mutations_under_no_grad_or_inference_mode=False,
|
| 24 |
+
mutation_inductor_storage_resize=False,
|
| 25 |
+
mutates_storage_metadata=False,
|
| 26 |
+
requires_grad=False,
|
| 27 |
+
keep_input_mutations=True)],
|
| 28 |
+
output_info=[OutputAliasInfo(output_type=<OutputType.non_alias: 1>,
|
| 29 |
+
raw_type=<class 'torch._subclasses.functional_tensor.FunctionalTensor'>,
|
| 30 |
+
base_idx=None,
|
| 31 |
+
dynamic_dims=set(),
|
| 32 |
+
requires_grad=False,
|
| 33 |
+
functional_tensor=None)],
|
| 34 |
+
num_intermediate_bases=0,
|
| 35 |
+
keep_input_mutations=True,
|
| 36 |
+
traced_tangents=[],
|
| 37 |
+
subclass_inp_meta=[PlainTensorMeta(unwrapped_idx=0,
|
| 38 |
+
memory_format=None),
|
| 39 |
+
PlainTensorMeta(unwrapped_idx=1,
|
| 40 |
+
memory_format=None),
|
| 41 |
+
PlainTensorMeta(unwrapped_idx=2,
|
| 42 |
+
memory_format=None)],
|
| 43 |
+
subclass_fw_graph_out_meta=[PlainTensorMeta(unwrapped_idx=0,
|
| 44 |
+
memory_format=None)],
|
| 45 |
+
subclass_tangent_meta=[],
|
| 46 |
+
is_train=False,
|
| 47 |
+
traced_tangent_metas=None,
|
| 48 |
+
num_symints_saved_for_bw=None,
|
| 49 |
+
grad_enabled_mutation=None,
|
| 50 |
+
deterministic=None,
|
| 51 |
+
static_input_indices=[],
|
| 52 |
+
tokens={},
|
| 53 |
+
indices_of_inputs_that_requires_grad_with_mutations_in_bw=[],
|
| 54 |
+
bw_donated_idxs=None,
|
| 55 |
+
num_backward_tokens=0,
|
| 56 |
+
num_graphsafe_rng_states=0,
|
| 57 |
+
graphsafe_rng_state_index=None)
|
-_0_0_0/aot_inference_graph_5.txt
ADDED
|
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
class <lambda>(torch.nn.Module):
|
| 2 |
+
def forward(self, arg0_1: "f32[4096, 8192][8192, 1]cuda:0", arg1_1: "f32[4096][1]cuda:0", arg2_1: "i32[4096][1]cuda:0"):
|
| 3 |
+
# File: /shared_volume/repos/quark/quark/torch/kernel/__init__.py:168 in forward, code: return ops.quark.scaled_fake_quantize(quant_dtype, inputs, scale, zero_point, axis, group_size, quant_min,
|
| 4 |
+
scaled_fake_quantize: "f32[4096, 8192][8192, 1]cuda:0" = torch.ops.quark.scaled_fake_quantize.default('int4', arg0_1, arg1_1, arg2_1, 0, 0, 0.0, 15.0, 0, 'per_channel', 'haha'); arg0_1 = arg1_1 = arg2_1 = None
|
| 5 |
+
return (scaled_fake_quantize,)
|
| 6 |
+
|
-_0_0_0/aotautograd_cache_bypass_9.json
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cache_bypass_hard_exception": false,
|
| 3 |
+
"cache_bypass_reason": "Unsupported call_function target <class 'torch.autograd.function.FunctionCtx'>. \n Function module: torch.autograd.function, \nFunction name: FunctionCtx",
|
| 4 |
+
"cache_state": "bypass",
|
| 5 |
+
"compile_id": "0/0",
|
| 6 |
+
"components": [],
|
| 7 |
+
"key": null
|
| 8 |
+
}
|
-_0_0_0/before_recompile_pre_grad_2.txt
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
class GraphModule(torch.nn.Module):
|
| 2 |
+
def forward(self, L_w_: "f32[4096, 8192][8192, 1]cuda:0", L_scale_: "f32[4096][1]cuda:0", L_zero_point_: "i32[4096][1]cuda:0"):
|
| 3 |
+
l_w_ = L_w_
|
| 4 |
+
l_scale_ = L_scale_
|
| 5 |
+
l_zero_point_ = L_zero_point_
|
| 6 |
+
|
| 7 |
+
# File: /shared_volume/repos/quark/bench_qdq.py:8 in run_scaled_fake_quantize, code: return scaled_fake_quantize(quant_dtype, w, scale, zero_point, axis, group_size, quant_min, quant_max, round_mode, qscheme, mx_element_dtype)
|
| 8 |
+
function_ctx = torch.autograd.function.FunctionCtx(); function_ctx = None
|
| 9 |
+
|
| 10 |
+
# File: /shared_volume/repos/quark/quark/torch/kernel/__init__.py:168 in forward, code: return ops.quark.scaled_fake_quantize(quant_dtype, inputs, scale, zero_point, axis, group_size, quant_min,
|
| 11 |
+
scaled_fake_quantize: "f32[4096, 8192][8192, 1]cuda:0" = torch.ops.quark.scaled_fake_quantize('int4', l_w_, l_scale_, l_zero_point_, 0, 0, 0, 15, 0, 'per_channel', 'haha'); l_w_ = l_scale_ = l_zero_point_ = None
|
| 12 |
+
return (scaled_fake_quantize,)
|
| 13 |
+
|
-_0_0_0/compilation_metrics_11.html
ADDED
|
@@ -0,0 +1,152 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
<html>
|
| 3 |
+
<head>
|
| 4 |
+
<style>
|
| 5 |
+
|
| 6 |
+
table td { vertical-align: top; }
|
| 7 |
+
|
| 8 |
+
.stack-trie { white-space: nowrap; font-family: monospace; }
|
| 9 |
+
.stack-trie ul { padding-left: 1ch; }
|
| 10 |
+
.stack-trie li { margin-left: 1ch; list-style-type: none; }
|
| 11 |
+
.stack-trie .marker {
|
| 12 |
+
cursor: pointer;
|
| 13 |
+
}
|
| 14 |
+
.stack-trie .marker.collapsed::before {
|
| 15 |
+
content: "+ ";
|
| 16 |
+
}
|
| 17 |
+
.stack-trie .marker:not(.collapsed)::before {
|
| 18 |
+
content: "- ";
|
| 19 |
+
}
|
| 20 |
+
.stack-trie a { text-decoration: none; }
|
| 21 |
+
.stack-trie a:hover { text-decoration: underline; }
|
| 22 |
+
.status-missing { background-color: purple; color: white; }
|
| 23 |
+
.status-error { background-color: red; color: white; }
|
| 24 |
+
.status-empty { background-color: white; color: black; }
|
| 25 |
+
.status-ok { background-color: green; color: white; }
|
| 26 |
+
.status-break { background-color: lime; color: black; }
|
| 27 |
+
summary::-webkit-details-marker { color: #00ACF3; font-size: 125%; margin-right: 2px; }
|
| 28 |
+
summary:focus { outline-style: none; }
|
| 29 |
+
article > details > summary { font-size: 28px; margin-top: 16px; }
|
| 30 |
+
details > p { margin-left: 24px; }
|
| 31 |
+
details details summary { font-size: 16px; }
|
| 32 |
+
|
| 33 |
+
</style>
|
| 34 |
+
<title>Compilation Metrics</title>
|
| 35 |
+
<base href="..">
|
| 36 |
+
</head>
|
| 37 |
+
<body>
|
| 38 |
+
<h1>Compilation Info for [0/0] </h1>
|
| 39 |
+
<p><details><summary>Stack</summary><div class='stack-trie'><ul><li>/shared_volume/repos/quark/bench_qdq.py:7 in run_scaled_fake_quantize<br> </li>
|
| 40 |
+
</ul></div></details></p>
|
| 41 |
+
<h2>Output files:</h2>
|
| 42 |
+
<ul>
|
| 43 |
+
|
| 44 |
+
<li><a href="-_0_0_0/dynamo_output_graph_0.txt">dynamo_output_graph_0.txt</a> (0)</li>
|
| 45 |
+
|
| 46 |
+
<li><a href="-_0_0_0/inductor_pre_grad_graph_1.txt">inductor_pre_grad_graph_1.txt</a> (1)</li>
|
| 47 |
+
|
| 48 |
+
<li><a href="-_0_0_0/before_recompile_pre_grad_2.txt">before_recompile_pre_grad_2.txt</a> (2)</li>
|
| 49 |
+
|
| 50 |
+
<li><a href="-_0_0_0/after_recompile_pre_grad_3.txt">after_recompile_pre_grad_3.txt</a> (3)</li>
|
| 51 |
+
|
| 52 |
+
<li><a href="-_0_0_0/aot_forward_graph_fw_metadata_4.txt">aot_forward_graph_fw_metadata_4.txt</a> (4)</li>
|
| 53 |
+
|
| 54 |
+
<li><a href="-_0_0_0/aot_inference_graph_5.txt">aot_inference_graph_5.txt</a> (5)</li>
|
| 55 |
+
|
| 56 |
+
<li><a href="-_0_0_0/torch._functorch.config_6.txt">torch._functorch.config_6.txt</a> (6)</li>
|
| 57 |
+
|
| 58 |
+
<li><a href="-_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html">inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html</a> (7)</li>
|
| 59 |
+
|
| 60 |
+
<li><a href="-_0_0_0/fx_graph_cache_hit_8.json">fx_graph_cache_hit_8.json</a> (8)</li>
|
| 61 |
+
|
| 62 |
+
<li><a href="-_0_0_0/aotautograd_cache_bypass_9.json">aotautograd_cache_bypass_9.json</a> (9)</li>
|
| 63 |
+
|
| 64 |
+
<li><a href="-_0_0_0/dynamo_cpp_guards_str_10.txt">dynamo_cpp_guards_str_10.txt</a> (10)</li>
|
| 65 |
+
|
| 66 |
+
</ul>
|
| 67 |
+
<h2>Stack</h2>
|
| 68 |
+
<details><summary>Stack</summary><div class='stack-trie'><ul><li>/shared_volume/repos/quark/bench_qdq.py:161 in <module><br> mean, median = do_bench(run_scaled_fake_quantize_comp, kwargs_scaled_fake_quantize, num_runs=num_runs, num_warmup=num_warmup, name="quark qdq")</li>
|
| 69 |
+
<li>/shared_volume/repos/quark/bench_qdq.py:70 in do_bench<br> f(**kwargs)</li>
|
| 70 |
+
<li>/shared_volume/repos/quark/bench_qdq.py:7 in run_scaled_fake_quantize<br> </li>
|
| 71 |
+
</ul></div></details>
|
| 72 |
+
<h2>Compile Time(seconds)</h2>
|
| 73 |
+
<p>Entire Frame <abbr title="Total time spent in convert_frame function">[?]</abbr>: 1.068891</div>
|
| 74 |
+
<p>Backend <abbr title="Time spent running the backend compiler">[?]</abbr>: 0.992908</div>
|
| 75 |
+
|
| 76 |
+
<p>Inductor <abbr title="Total time spent running inductor">[?]</abbr>: 0.414598</div>
|
| 77 |
+
|
| 78 |
+
|
| 79 |
+
<div>Dynamo Time Before Restart <abbr title="Total time spent restarting dynamo analysis">[?]</abbr>: 0.0</div>
|
| 80 |
+
<h2>Restarts and Failures</h2>
|
| 81 |
+
|
| 82 |
+
<p> No failures! </p>
|
| 83 |
+
|
| 84 |
+
|
| 85 |
+
<p> No restarts! </p>
|
| 86 |
+
|
| 87 |
+
<h2>Cache Metrics</h2>
|
| 88 |
+
<p>Cache Size: 0</p>
|
| 89 |
+
<p>Accumulated Cache Size: 0</p>
|
| 90 |
+
<h2>Graph Metrics</h2>
|
| 91 |
+
<p>Guard Count: 21</p>
|
| 92 |
+
<p>Shape Env Guards: 0</p>
|
| 93 |
+
<p>Graph Ops: 2</p>
|
| 94 |
+
<p>Graph Nodes: 6</p>
|
| 95 |
+
<p>Graph Inputs: 3</p>
|
| 96 |
+
<h2> Custom Ops </h2>
|
| 97 |
+
|
| 98 |
+
|
| 99 |
+
<p> Non-Compliant Custom Ops:</p>
|
| 100 |
+
|
| 101 |
+
<li> <code> quark::scaled_fake_quantize </code> </li>
|
| 102 |
+
|
| 103 |
+
|
| 104 |
+
<h2>Symbolic shape specializations</h2>
|
| 105 |
+
<table>
|
| 106 |
+
<tr>
|
| 107 |
+
<th>Sym</th> <th>Source(s)</th> <th>Value</th> <th>User stack</th> <th>Framework stack</th>
|
| 108 |
+
</tr>
|
| 109 |
+
|
| 110 |
+
</table>
|
| 111 |
+
<h2>Guards added fast</h2>
|
| 112 |
+
<table>
|
| 113 |
+
<tr>
|
| 114 |
+
<th>Expr</th> <th>User stack</th> <th>Framework stack</th>
|
| 115 |
+
</tr>
|
| 116 |
+
|
| 117 |
+
</table>
|
| 118 |
+
|
| 119 |
+
<script>
|
| 120 |
+
document.addEventListener('DOMContentLoaded', function() {
|
| 121 |
+
|
| 122 |
+
// Append the current URL's query parameters to all relative links on the page
|
| 123 |
+
const queryParams = new URLSearchParams(window.location.search);
|
| 124 |
+
if (queryParams.size === 0) return url; // No query params, return original URL
|
| 125 |
+
|
| 126 |
+
function appendQueryParams(url) {
|
| 127 |
+
const newURL = new URL((new Request(url)).url); // new URL(<relative URL>) but it actually works
|
| 128 |
+
const newSearchParams = new URLSearchParams(newURL.searchParams);
|
| 129 |
+
console.log(newURL.searchParams);
|
| 130 |
+
console.log(newSearchParams);
|
| 131 |
+
|
| 132 |
+
// Append query parameters
|
| 133 |
+
for (const [key, value] of queryParams) {
|
| 134 |
+
newSearchParams.set(key, value);
|
| 135 |
+
}
|
| 136 |
+
|
| 137 |
+
newURL.search = newSearchParams;
|
| 138 |
+
return newURL;
|
| 139 |
+
}
|
| 140 |
+
|
| 141 |
+
// Select all relative links on the page
|
| 142 |
+
const relativeLinks = document.querySelectorAll('a[href]:not([href^="http://"]):not([href^="https://"]):not([href^="\#"])');
|
| 143 |
+
|
| 144 |
+
// Append query parameters to each relative link
|
| 145 |
+
relativeLinks.forEach((link) => {
|
| 146 |
+
link.setAttribute("href", appendQueryParams(link.getAttribute("href")))
|
| 147 |
+
});
|
| 148 |
+
});
|
| 149 |
+
</script>
|
| 150 |
+
|
| 151 |
+
</body>
|
| 152 |
+
</html>
|
-_0_0_0/dynamo_cpp_guards_str_10.txt
ADDED
|
@@ -0,0 +1,47 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
TREE_GUARD_MANAGER:
|
| 3 |
+
+- RootGuardManager
|
| 4 |
+
| +- DEFAULT_DEVICE: utils_device.CURRENT_DEVICE == None # _dynamo/output_graph.py:520 in init_ambient_guards
|
| 5 |
+
| +- GLOBAL_STATE: ___check_global_state()
|
| 6 |
+
| +- TORCH_FUNCTION_MODE_STACK: ___check_torch_function_mode_stack()
|
| 7 |
+
| +- GuardManager: source=L['w'], accessed_by=FrameLocalsGuardAccessor(key='w', framelocals_idx=1)
|
| 8 |
+
| | +- TENSOR_MATCH: check_tensor(L['w'], Tensor, DispatchKeySet(CUDA, BackendSelect, ADInplaceOrView, AutogradCUDA), torch.float32, device=0, requires_grad=False, size=[4096, 8192], stride=[8192, 1])
|
| 9 |
+
| | +- NO_HASATTR: hasattr(L['w'], '_dynamo_dynamic_indices') == False
|
| 10 |
+
| | +- NO_TENSOR_ALIASING: check_no_aliasing(L['w'], L['scale'], L['zero_point'])
|
| 11 |
+
| +- GuardManager: source=L['axis'], accessed_by=FrameLocalsGuardAccessor(key='axis', framelocals_idx=4)
|
| 12 |
+
| | +- EQUALS_MATCH: L['axis'] == 0
|
| 13 |
+
| +- GuardManager: source=L['scale'], accessed_by=FrameLocalsGuardAccessor(key='scale', framelocals_idx=2)
|
| 14 |
+
| | +- TENSOR_MATCH: check_tensor(L['scale'], Tensor, DispatchKeySet(CUDA, BackendSelect, ADInplaceOrView, AutogradCUDA), torch.float32, device=0, requires_grad=False, size=[4096], stride=[1])
|
| 15 |
+
| | +- NO_HASATTR: hasattr(L['scale'], '_dynamo_dynamic_indices') == False
|
| 16 |
+
| | +- NO_TENSOR_ALIASING
|
| 17 |
+
| +- GuardManager: source=L['qscheme'], accessed_by=FrameLocalsGuardAccessor(key='qscheme', framelocals_idx=9)
|
| 18 |
+
| | +- EQUALS_MATCH: L['qscheme'] == 'per_channel'
|
| 19 |
+
| +- GuardManager: source=L['quant_max'], accessed_by=FrameLocalsGuardAccessor(key='quant_max', framelocals_idx=7)
|
| 20 |
+
| | +- EQUALS_MATCH: L['quant_max'] == 15
|
| 21 |
+
| +- GuardManager: source=L['quant_min'], accessed_by=FrameLocalsGuardAccessor(key='quant_min', framelocals_idx=6)
|
| 22 |
+
| | +- EQUALS_MATCH: L['quant_min'] == 0
|
| 23 |
+
| +- GuardManager: source=L['group_size'], accessed_by=FrameLocalsGuardAccessor(key='group_size', framelocals_idx=5)
|
| 24 |
+
| | +- EQUALS_MATCH: L['group_size'] == 0
|
| 25 |
+
| +- GuardManager: source=L['round_mode'], accessed_by=FrameLocalsGuardAccessor(key='round_mode', framelocals_idx=8)
|
| 26 |
+
| | +- EQUALS_MATCH: L['round_mode'] == 0
|
| 27 |
+
| +- GuardManager: source=L['zero_point'], accessed_by=FrameLocalsGuardAccessor(key='zero_point', framelocals_idx=3)
|
| 28 |
+
| | +- TENSOR_MATCH: check_tensor(L['zero_point'], Tensor, DispatchKeySet(CUDA, BackendSelect, ADInplaceOrView, AutogradCUDA), torch.int32, device=0, requires_grad=False, size=[4096], stride=[1])
|
| 29 |
+
| | +- NO_HASATTR: hasattr(L['zero_point'], '_dynamo_dynamic_indices') == False
|
| 30 |
+
| | +- NO_TENSOR_ALIASING
|
| 31 |
+
| +- GuardManager: source=L['quant_dtype'], accessed_by=FrameLocalsGuardAccessor(key='quant_dtype', framelocals_idx=0)
|
| 32 |
+
| | +- EQUALS_MATCH: L['quant_dtype'] == 'int4'
|
| 33 |
+
| +- GuardManager: source=L['mx_element_dtype'], accessed_by=FrameLocalsGuardAccessor(key='mx_element_dtype', framelocals_idx=10)
|
| 34 |
+
| | +- EQUALS_MATCH: L['mx_element_dtype'] == 'haha'
|
| 35 |
+
| +- GuardManager: source=G, accessed_by=GlobalsGuardAccessor
|
| 36 |
+
| | +- GuardManager: source=G['scaled_fake_quantize'], accessed_by=DictGetItemGuardAccessor('scaled_fake_quantize')
|
| 37 |
+
| | | +- ID_MATCH: ___check_obj_id(G['scaled_fake_quantize'], 140615015598720)
|
| 38 |
+
| | +- GuardManager: source=G['__import_quark_dot_torch_dot_kernel'], accessed_by=DictGetItemGuardAccessor('__import_quark_dot_torch_dot_kernel')
|
| 39 |
+
| | | +- ID_MATCH: ___check_obj_id(G['__import_quark_dot_torch_dot_kernel'], 140649485511360)
|
| 40 |
+
| | | +- GuardManager: source=G['__import_quark_dot_torch_dot_kernel'].ops, accessed_by=GetAttrGuardAccessor(ops)
|
| 41 |
+
| | | | +- ID_MATCH: ___check_obj_id(G['__import_quark_dot_torch_dot_kernel'].ops, 140649515082000)
|
| 42 |
+
| | | | +- GuardManager: source=G['__import_quark_dot_torch_dot_kernel'].ops.quark, accessed_by=GetAttrGuardAccessor(quark)
|
| 43 |
+
| | | | | +- ID_MATCH: ___check_obj_id(G['__import_quark_dot_torch_dot_kernel'].ops.quark, 140649455882608)
|
| 44 |
+
| | | | | +- GuardManager: source=G['__import_quark_dot_torch_dot_kernel'].ops.quark.scaled_fake_quantize, accessed_by=GetAttrGuardAccessor(scaled_fake_quantize)
|
| 45 |
+
| | | | | | +- ID_MATCH: ___check_obj_id(G['__import_quark_dot_torch_dot_kernel'].ops.quark.scaled_fake_quantize, 140614946665776)
|
| 46 |
+
|
| 47 |
+
Guard latency = 0.84 us
|
-_0_0_0/dynamo_output_graph_0.txt
ADDED
|
@@ -0,0 +1,13 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
class GraphModule(torch.nn.Module):
|
| 2 |
+
def forward(self, L_w_: "f32[4096, 8192][8192, 1]cuda:0", L_scale_: "f32[4096][1]cuda:0", L_zero_point_: "i32[4096][1]cuda:0"):
|
| 3 |
+
l_w_ = L_w_
|
| 4 |
+
l_scale_ = L_scale_
|
| 5 |
+
l_zero_point_ = L_zero_point_
|
| 6 |
+
|
| 7 |
+
# File: /shared_volume/repos/quark/bench_qdq.py:8 in run_scaled_fake_quantize, code: return scaled_fake_quantize(quant_dtype, w, scale, zero_point, axis, group_size, quant_min, quant_max, round_mode, qscheme, mx_element_dtype)
|
| 8 |
+
function_ctx = torch.autograd.function.FunctionCtx(); function_ctx = None
|
| 9 |
+
|
| 10 |
+
# File: /shared_volume/repos/quark/quark/torch/kernel/__init__.py:168 in forward, code: return ops.quark.scaled_fake_quantize(quant_dtype, inputs, scale, zero_point, axis, group_size, quant_min,
|
| 11 |
+
scaled_fake_quantize: "f32[4096, 8192][8192, 1]cuda:0" = torch.ops.quark.scaled_fake_quantize('int4', l_w_, l_scale_, l_zero_point_, 0, 0, 0, 15, 0, 'per_channel', 'haha'); l_w_ = l_scale_ = l_zero_point_ = None
|
| 12 |
+
return (scaled_fake_quantize,)
|
| 13 |
+
|
-_0_0_0/fx_graph_cache_hit_8.json
ADDED
|
@@ -0,0 +1,315 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"cache_event_time": 1750251842521445359,
|
| 3 |
+
"cache_state": "hit",
|
| 4 |
+
"compile_id": "0/0",
|
| 5 |
+
"components": [
|
| 6 |
+
"[b6z7ijvsnbtjurvqwdotlb6qtuyjsz4krtpkqj5thbq3fhqsbhp] gm: <lambda>()\n\n\n\ndef forward(self, arg0_1, arg1_1, arg2_1):\n scaled_fake_quantize = torch.ops.quark.scaled_fake_quantize.default('int4', arg0_1, arg1_1, arg2_1, 0, 0, 0.0, 15.0, 0, 'per_channel', 'haha'); arg0_1 = arg1_1 = arg2_1 = None\n return (scaled_fake_quantize,)\n \n# To see more debug info, please use `graph_module.print_readable()`",
|
| 7 |
+
"[nef3d47wx7hdxcyvwgucihijvag3qlbodqmms7dktjkxqgk4gux] example_inputs[0]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096, 8192]), stride=(8192, 1), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 8 |
+
"[7eps4cy57l62xkqx7rnf6ttfsuweegaqsqravzj2x5h4v6fbtod] example_inputs[1]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 9 |
+
"[dpovg5nw4n7fkaetfrkwcqepypqcssr7fzpd75svn53n4xjxfow] example_inputs[2]: TensorMetadata(dtype=torch.int32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 10 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] cache_key_tag: ",
|
| 11 |
+
"[lmglpn4zi7vob56n34r2j2rk7flv5xfgrcvmo7xcpirqsitygqx] fx_kwargs[boxed_forward_device_index]: BoxedDeviceIndex(value=None)",
|
| 12 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[cpp_wrapper]: False",
|
| 13 |
+
"[xq2hdkbfkbcuye6rgtypayrkhqf4cntij2dsd24rei3lsknakkf] fx_kwargs[cudagraphs]: BoxedBool(value=False)",
|
| 14 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[extern_node_serializer]: None",
|
| 15 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[is_backward]: False",
|
| 16 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] fx_kwargs[is_inference]: True",
|
| 17 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[layout_opt]: None",
|
| 18 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] fx_kwargs[static_input_idxs]: []",
|
| 19 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inputs_to_check[0]: 0",
|
| 20 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inputs_to_check[1]: 1",
|
| 21 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inputs_to_check[2]: 2",
|
| 22 |
+
"[du4vyrfyozrfxcf6kk6ma7oqwatapifazeelfsawmsiu6gjdtxp] deterministic_algorithms_settings: (False, False, True)",
|
| 23 |
+
"[qiptf2633zubseuei4bkisoq3not35l6lud6p23p4qmcsxiw2uq] cuda_matmul_settings: (False, True, True)",
|
| 24 |
+
"[ol6sj5vrtmgqd5cnfjbun7wbukfn7jyrtpkapnhmsysjdypit4i] torch_version: <bytes>",
|
| 25 |
+
"[rlwghyno43ot2zz35l3xlcrrh3arqenri6t5nsopt3t3q333zgy] system_info[device]: {'name': 'gfx942:sramecc+:xnack-'}",
|
| 26 |
+
"[njkbnmcun3rnt2yz2lgf57oprgdbjzlkadbcfoy57sir5fnskzg] system_info[version]: {'triton': '3.3.02e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-364a7d1dd5f29867a741138f83c5b453259e240a5d51f364f24f7196cedbf442-2e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-23d635e690d670bf61798e1259674b78c0ed5ba222ab6a455f329f27a758fc2d-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-ca6686d24a6f780b8449b43d419d11c978ebd00ab87a5fc6e57198a2027680d0-00deb4ba92653e089ad09c2f67cbc85602c84cd3ee2347ddcfcccc2081cfa45e-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-78995dd40c4e54964f62cdc6d47e66f6d9df8b55b172ad7eb99235f27999c840-f7c26e8ffdaf8cd2491de04217d32827b1a4f859f7f93ea56e26590c9f5e071a-a5b982237b29a230519ad566660a5912ae9d31da0dd6388465f3a1043b12ece7-6e4a7df0c1f6cb799f488ee1d6efd3df754fc18aac6e7209923bb022c36c7c4e-f983f9d6d6f987af520297c8fe3185601ae8f7d60bacab880ac9326bdfee1f67-5d15c5bebef8d7aa51b21fd187e5faa95eba4a213254355bc69e0648013599f7-26a8aeaf21e759191f173b578316e243ad970387442a1b238481c6a1b2eecdc4-bd364752852b76a0b75a9d93ecbc239781b730aa75021445a02d795aa8d38f6a-72bc1771d8b160fbafcd5390d1ee6cb72440c10ad4834451465a9e93b42f5d1c-7b506c955ee5646862dae548968e6523d75c37ad4750c214d9ab0f6918ecc88a-89e4844782de5fdff4868ac2846514570a6e280a6b92e91af2e180904043c833-115ada51f797cd098ddc5e4b95e8369a885571b15639694b6801f59e46eab55e-0e48b5e1e95136642ccfe62dc3d0a739a2c20a7b5ee13e9c23c6cecd68cdeb70-b616015f724e553348f5b019f7324dec130f7bbaf984d43300fa69c7c2fdda2f-54fe722cbe379a55695ab9478e73d344377cf5e9d6e055aff7cd03bf6fff1b2a-10285555cd515e21ca54714fc8eb9c173cca6b092b5e951a17ae5eee28ed2707-f2d4e73182e68eddc6237577b2158b7d8498ccb3c50642b9c74c55d3f4be3943', 'hip': '6.3.42131-fa1d09cbd'}",
|
| 27 |
+
"[3qefpuc3yyxaxf25vrqt6skezzayzydwq2o6i2xf2qdyioam5zw] system_info[hash]: 6e7af1eb52fca9b11dcfccdeb7b2a74263a0c6d2c07fe2b7f2c2003a4663609b",
|
| 28 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[TYPE_CHECKING]: False",
|
| 29 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_padding]: True",
|
| 30 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[can_inplace_pad_graph_input]: False",
|
| 31 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[enable_auto_functionalized_v2]: True",
|
| 32 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug]: False",
|
| 33 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_progress]: True",
|
| 34 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[verbose_progress]: False",
|
| 35 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[fx_graph_cache]: True",
|
| 36 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[fx_graph_remote_cache]: None",
|
| 37 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bundle_triton_into_fx_graph_cache]: True",
|
| 38 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_local_cache]: True",
|
| 39 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[autotune_remote_cache]: None",
|
| 40 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[bundled_autotune_remote_cache]: None",
|
| 41 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_disable_caches]: False",
|
| 42 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[sleep_sec_TESTING_ONLY]: None",
|
| 43 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[custom_op_default_layout_constraint]: needs_fixed_stride_order",
|
| 44 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[triton_kernel_default_layout_constraint]: needs_fixed_stride_order",
|
| 45 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp_wrapper]: False",
|
| 46 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[online_softmax]: True",
|
| 47 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[dce]: False",
|
| 48 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[static_weight_shapes]: True",
|
| 49 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[size_asserts]: True",
|
| 50 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[nan_asserts]: False",
|
| 51 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[scalar_asserts]: True",
|
| 52 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pick_loop_orders]: True",
|
| 53 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_buffers]: True",
|
| 54 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[allow_buffer_reuse]: True",
|
| 55 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[memory_planning]: False",
|
| 56 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[use_fast_math]: False",
|
| 57 |
+
"[x75won4jmsgeb63pcvwr2y4eteyzzdhmf5rv6xhjppie4hx2yu5] inductor_config[memory_pool]: intermediates",
|
| 58 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_harness]: True",
|
| 59 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[epilogue_fusion]: True",
|
| 60 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[prologue_fusion]: True",
|
| 61 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[epilogue_fusion_first]: False",
|
| 62 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pattern_matcher]: True",
|
| 63 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[b2b_gemm_pass]: False",
|
| 64 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_pre_pass]: None",
|
| 65 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_post_pass]: None",
|
| 66 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[pre_grad_custom_pass]: None",
|
| 67 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_cat_fx_passes]: True",
|
| 68 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[efficient_conv_bn_eval_fx_passes]: False",
|
| 69 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_predispatch]: False",
|
| 70 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[group_fusion]: False",
|
| 71 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[batch_fusion]: True",
|
| 72 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[pre_grad_fusion_options]: {}",
|
| 73 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[post_grad_fusion_options]: {}",
|
| 74 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_locality]: True",
|
| 75 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[dynamic_scale_rblock]: True",
|
| 76 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_fuse_int_mm_with_mul]: False",
|
| 77 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_mixed_mm]: True",
|
| 78 |
+
"[zwmmbkdkarexuhbigurz5lfnhx64tht7fznecjkrvznh6rzivbv] inductor_config[fx_passes_numeric_check]: {'pre_grad': False, 'precision': 0.0001, 'num_iterations': 1, 'requires_optimizer': True}",
|
| 79 |
+
"[v2td5s4lnsvyxvaevy4chx6kc5h3mm2axazbgwimqule5zrzao7] inductor_config[mixed_mm_choice]: heuristic",
|
| 80 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[reorder_for_compute_comm_overlap]: False",
|
| 81 |
+
"[ssupi7bu3rrhdpg2jyegzncu3kg3nnhklyliqvutaxgs7y7k3dx] inductor_config[reorder_for_compute_comm_overlap_passes]: ['reorder_compute_for_overlap', 'sink_waits', 'raise_comms']",
|
| 82 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_peak_memory]: True",
|
| 83 |
+
"[lxxtoqhcoepwfokeiibd575gnxo3uzwiv4hmpomlwkpzqz3qzsh] inductor_config[estimate_op_runtime]: default",
|
| 84 |
+
"[yezuzjtg4h3jjur4jwtwiehbyixa7eonq4tqsqmwqve2lvvmrem] inductor_config[intra_node_bw]: 300",
|
| 85 |
+
"[5fxczt3ciyxitdhizb7sfsgn7fhpczcqsngttnt5ot2wyctk7co] inductor_config[inter_node_bw]: 25",
|
| 86 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_experimental_benchmarker]: True",
|
| 87 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[max_autotune]: True",
|
| 88 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_pointwise]: False",
|
| 89 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_gemm]: False",
|
| 90 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[autotune_num_choices_displayed]: 10",
|
| 91 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[graph_partition]: False",
|
| 92 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_same_precision]: False",
|
| 93 |
+
"[2y7luesktjrque3nr7qtxnum2mkbeegzdrsvkm3rvdlhqboajhx] inductor_config[max_autotune_gemm_backends]: ATEN,TRITON,CPP",
|
| 94 |
+
"[uqlsbif4zxd75vt522p52txyuguieipi2lwz5g5awt56lccqk7s] inductor_config[max_autotune_conv_backends]: ATEN,TRITON",
|
| 95 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[max_autotune_gemm_search_space]: DEFAULT",
|
| 96 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_fallback_to_aten]: True",
|
| 97 |
+
"[wft6ljqsfr3x4m7fa5zuyb7cwknky4irrxz4bjr6uzr2yiopxqj] inductor_config[unbacked_symint_fallback]: 8192",
|
| 98 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[search_autotune_cache]: False",
|
| 99 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[save_args]: False",
|
| 100 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_in_subproc]: False",
|
| 101 |
+
"[iglov24t7x5ruci344aer2tm6nqshi4veuw4wxlssxtu46cx76m] inductor_config[max_autotune_subproc_result_timeout_seconds]: 60.0",
|
| 102 |
+
"[bh33ranllcgilhgmgr3qvygzxjm6isq5iexnfm3zx6fnr2zwlp2] inductor_config[max_autotune_subproc_graceful_timeout_seconds]: 1.0",
|
| 103 |
+
"[pwoh5aypf4fxbntdvwt67rppxorqos6xr3w7qzeun6kblbfg2ga] inductor_config[max_autotune_subproc_terminate_timeout_seconds]: 2.0",
|
| 104 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_multi_device]: False",
|
| 105 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[coordinate_descent_tuning]: True",
|
| 106 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[coordinate_descent_check_all_directions]: False",
|
| 107 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[coordinate_descent_search_radius]: 1",
|
| 108 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[autoheuristic_collect]: ",
|
| 109 |
+
"[jwbrgxes7vjqumngs5hyj6gn5nytv2whnppnzngvaagfmawhkkd] inductor_config[autoheuristic_use]: mixed_mm",
|
| 110 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[autoheuristic_log_path]: DEFAULT",
|
| 111 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[layout_opt_default]: 0",
|
| 112 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[layout_optimization]: False",
|
| 113 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_layout_optimization]: False",
|
| 114 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[keep_output_stride]: True",
|
| 115 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[warn_mix_layout]: False",
|
| 116 |
+
"[lkkae3meylaixfif4thncru4hjqeaislawjoghffrbwuscaagei] inductor_config[realize_reads_threshold]: 4",
|
| 117 |
+
"[rr5m5hsocoyodldz7vcvaizdwvm2rt34evmqdxvng7wz3tufvo6] inductor_config[realize_opcount_threshold]: 30",
|
| 118 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[realize_acc_reads_threshold]: 8",
|
| 119 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[fallback_random]: False",
|
| 120 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[implicit_fallbacks]: True",
|
| 121 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aggressive_fusion]: False",
|
| 122 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_fusion]: False",
|
| 123 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_fusion]: False",
|
| 124 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[enabled_metric_tables]: ",
|
| 125 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[loop_ordering_after_fusion]: False",
|
| 126 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[score_fusion_memory_threshold]: 10",
|
| 127 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_epilogue_fusion]: True",
|
| 128 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[max_epilogue_benchmarked_choices]: 1",
|
| 129 |
+
"[jykiys6ynafs3zdylwa5ggq6j655mxeh42d6mtdi22gffkrmiac] inductor_config[max_fusion_size]: 64",
|
| 130 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[max_pointwise_cat_inputs]: 8",
|
| 131 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_pointwise_cat]: False",
|
| 132 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[unroll_reductions_threshold]: 8",
|
| 133 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[comment_origin]: False",
|
| 134 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[conv_1x1_as_mm]: False",
|
| 135 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_reductions]: True",
|
| 136 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_kernel]: False",
|
| 137 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[constant_and_index_propagation]: True",
|
| 138 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[always_keep_tensor_constants]: False",
|
| 139 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[assert_indirect_indexing]: True",
|
| 140 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[compute_all_bounds]: False",
|
| 141 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernels]: False",
|
| 142 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_combo_kernel]: False",
|
| 143 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernels_autotune]: 1",
|
| 144 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernel_allow_mixed_sizes]: 1",
|
| 145 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernel_foreach_dynamic_shapes]: False",
|
| 146 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[joint_graph_constant_folding]: True",
|
| 147 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_index_asserts]: False",
|
| 148 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[emulate_precision_casts]: False",
|
| 149 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_nightly_or_source]: False",
|
| 150 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[developer_warnings]: False",
|
| 151 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[optimize_scatter_upon_const_tensor]: True",
|
| 152 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[add_pre_grad_passes]: None",
|
| 153 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[remove_pre_grad_passes]: None",
|
| 154 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[global_cache_dir]: None",
|
| 155 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[kernel_name_max_ops]: 10",
|
| 156 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[shape_padding]: True",
|
| 157 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[comprehensive_padding]: True",
|
| 158 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_channels_last]: False",
|
| 159 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_padding_cpu]: True",
|
| 160 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[padding_alignment_bytes]: 128",
|
| 161 |
+
"[dnnw5ks3yxrp7mwvihb2hh4tqx35ye637xt33x64kw4fvz2nyzg] inductor_config[padding_stride_threshold]: 1024",
|
| 162 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_outputs]: False",
|
| 163 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bw_outputs_user_visible]: True",
|
| 164 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_shape_pad]: False",
|
| 165 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[permute_fusion]: False",
|
| 166 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profiler_mark_wrapper_call]: False",
|
| 167 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[generate_intermediate_hooks]: False",
|
| 168 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_ir_traceback]: False",
|
| 169 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth]: False",
|
| 170 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[profile_bandwidth_regex]: ",
|
| 171 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[profile_bandwidth_output]: None",
|
| 172 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth_with_do_bench_using_profiling]: False",
|
| 173 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[disable_cpp_codegen]: False",
|
| 174 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing]: False",
|
| 175 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing_discard_parameters]: False",
|
| 176 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[decompose_mem_bound_mm]: False",
|
| 177 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[assume_aligned_inputs]: False",
|
| 178 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[unsafe_ignore_unsupported_triton_autotune_args]: False",
|
| 179 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[check_stack_no_cycles_TESTING_ONLY]: False",
|
| 180 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[enable_linear_binary_folding]: False",
|
| 181 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[annotate_training]: False",
|
| 182 |
+
"[sz3im5ogc6asp7g4uqocnovype63tkdexzfrniv6hn2oank3biu] inductor_config[cpp.threads]: -1",
|
| 183 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.no_redundant_loops]: True",
|
| 184 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.dynamic_threads]: False",
|
| 185 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.simdlen]: None",
|
| 186 |
+
"[g7rrnbg5yonzux3cfj5ovre5lob3ayda7qcfpxjvtwmiz4uicii] inductor_config[cpp.min_chunk_size]: 4096",
|
| 187 |
+
"[c7zj4qytmety6keurs3hsh5wn7foxp3dqx4kym2ucszzcb2ngrf] inductor_config[cpp.cxx]: (None, 'g++')",
|
| 188 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_kernel_profile]: False",
|
| 189 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.weight_prepack]: True",
|
| 190 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_relu_bug_TESTING_ONLY]: None",
|
| 191 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_log1p_bug_TESTING_ONLY]: None",
|
| 192 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.vec_isa_ok]: None",
|
| 193 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[cpp.descriptive_names]: original_aten",
|
| 194 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[cpp.max_horizontal_fusion_size]: 16",
|
| 195 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.fallback_scatter_reduce_sum]: True",
|
| 196 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_unsafe_math_opt_flag]: False",
|
| 197 |
+
"[ijs44lspkinjvhcs7uff7n3noc53jvsp4yfljjh22mafhb7khxe] inductor_config[cpp.enable_floating_point_contract_flag]: off",
|
| 198 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_tiling_heuristics]: True",
|
| 199 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_grouped_gemm_template]: False",
|
| 200 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cpp.gemm_max_k_slices]: 1",
|
| 201 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_cache_blocking]: None",
|
| 202 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_thread_factors]: None",
|
| 203 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_loop_tail_vec]: True",
|
| 204 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_concat_linear]: False",
|
| 205 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraphs]: False",
|
| 206 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_trees]: True",
|
| 207 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_skip_dynamic_graphs]: False",
|
| 208 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.slow_path_cudagraph_asserts]: True",
|
| 209 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_trees_history_recording]: False",
|
| 210 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_support_input_mutation]: True",
|
| 211 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[triton.cudagraph_unexpected_rerecord_limit]: 128",
|
| 212 |
+
"[tuax46wac7rfv2trf5gcps6vleo3cq44lbnrdxtprvo3ljjaddj] inductor_config[triton.cudagraph_dynamic_shape_warn_limit]: 50",
|
| 213 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraph_sync]: False",
|
| 214 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraphs_warmup]: False",
|
| 215 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.fast_path_cudagraph_asserts]: False",
|
| 216 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_cudagraph_warmup]: False",
|
| 217 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_graph]: False",
|
| 218 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_kernel]: False",
|
| 219 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.dense_indexing]: False",
|
| 220 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[triton.max_tiles]: 2",
|
| 221 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.prefer_nd_tiling]: False",
|
| 222 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_pointwise]: True",
|
| 223 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_cublasLt]: True",
|
| 224 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.autotune_at_compile_time]: None",
|
| 225 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.tile_reductions]: False",
|
| 226 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_pointwise_fusion]: True",
|
| 227 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_reduction_fusion]: True",
|
| 228 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.unique_kernel_names]: True",
|
| 229 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.unique_user_kernel_names]: False",
|
| 230 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[triton.descriptive_names]: original_aten",
|
| 231 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.persistent_reductions]: True",
|
| 232 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cooperative_reductions]: False",
|
| 233 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cooperative_reductions]: False",
|
| 234 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inductor_config[triton.multi_kernel]: 0",
|
| 235 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.divisible_by_16]: True",
|
| 236 |
+
"[fv6slhtedtydps5s5u2etitscliblzcidyitqf7krsv4e23fzk6] inductor_config[triton.min_split_scan_rblock]: 256",
|
| 237 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.store_cubin]: False",
|
| 238 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[triton.spill_threshold]: 16",
|
| 239 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.use_block_ptr]: False",
|
| 240 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.inject_relu_bug_TESTING_ONLY]: None",
|
| 241 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.codegen_upcast_to_fp32]: True",
|
| 242 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.enable_persistent_tma_matmul]: False",
|
| 243 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_l1_cache]: False",
|
| 244 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.disallow_failing_autotune_kernels_TESTING_ONLY]: False",
|
| 245 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.output_path]: ",
|
| 246 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.debug_compile]: False",
|
| 247 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.compile_wrapper_with_O0]: False",
|
| 248 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[aot_inductor.debug_intermediate_value_printer]: 0",
|
| 249 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[aot_inductor.filtered_kernel_names]: None",
|
| 250 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_in_spec]: ",
|
| 251 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_out_spec]: ",
|
| 252 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_runtime_constant_folding]: False",
|
| 253 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.force_mmap_weights]: False",
|
| 254 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package]: False",
|
| 255 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package_cpp_only]: False",
|
| 256 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.metadata]: {}",
|
| 257 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.raise_error_on_ignored_optimization]: True",
|
| 258 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.dump_aoti_minifier]: False",
|
| 259 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[aot_inductor.repro_level]: 2",
|
| 260 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.presets]: {}",
|
| 261 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.allow_stack_allocation]: False",
|
| 262 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_minimal_arrayref_interface]: False",
|
| 263 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.package_constants_in_so]: True",
|
| 264 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.arch]: None",
|
| 265 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.version]: None",
|
| 266 |
+
"[tvyftmtdmezlejo2xllu7awzv4pzc4vm4fub4b3gpl5jptjkosi] inductor_config[cuda.compile_opt_level]: -O1",
|
| 267 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_cuda_lto]: False",
|
| 268 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_ptxas_info]: False",
|
| 269 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_debug_info]: False",
|
| 270 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.use_fast_math]: False",
|
| 271 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_max_profiling_configs]: None",
|
| 272 |
+
"[xaicuyqjstadzph6cgvxowlzizkts6kzmfupsnbyaorxh37cppz] inductor_config[cuda.cutlass_max_profiling_swizzle_options]: [1, 2, 4]",
|
| 273 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cuda_cxx]: None",
|
| 274 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cuda.cutlass_backend_min_gemm_size]: 1",
|
| 275 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.generate_test_runner]: False",
|
| 276 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_allowlist_regex]: None",
|
| 277 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_denylist_regex]: None",
|
| 278 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[cuda.cutlass_instantiation_level]: 0",
|
| 279 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[rocm.arch]: []",
|
| 280 |
+
"[3w3j4h2iiu3addwyb5alaeecz3so7teb23hp4d5n3b46w5n73ur] inductor_config[rocm.ck_supported_arch]: ['gfx90a', 'gfx942']",
|
| 281 |
+
"[klfqjprnpfhcdurgvuikvc4rpd5ynkpk77toousr5h3u5roty6p] inductor_config[rocm.compile_opt_level]: -O2",
|
| 282 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.is_debug]: False",
|
| 283 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.save_temps]: False",
|
| 284 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.use_fast_math]: True",
|
| 285 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.flush_denormals]: True",
|
| 286 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.print_kernel_resource_usage]: False",
|
| 287 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.rocm_home]: None",
|
| 288 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.ck_dir]: None",
|
| 289 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.generate_test_runner]: False",
|
| 290 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.n_max_profiling_configs]: None",
|
| 291 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.use_preselected_instances]: False",
|
| 292 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.kBatch_sweep]: None",
|
| 293 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[rocm.split_k_threshold]: 16",
|
| 294 |
+
"[bsvfcwwoczx2rlkdz2eta6doujsymyihmi46hhwk6clrrvwcb6m] inductor_config[cpu_backend]: cpp",
|
| 295 |
+
"[caw4ly2z672k6kjfahoxwpajp5idhhtrpgf3ma2clylcp7c7aid] inductor_config[cuda_backend]: triton",
|
| 296 |
+
"[ljhgflgihidopsfsdcbqynv27nceykby3nutyd5jlcpq7n6e7l4] inductor_config[halide.cpu_target]: host",
|
| 297 |
+
"[wx7vmsmrdpk5ue2txlywp3lj3faqmdjphs5fgg2ehzsyno7uovg] inductor_config[halide.gpu_target]: host-cuda",
|
| 298 |
+
"[svgytlua5wcyeia7wq7e6zgh5tsueikrnzchmdmouvmkpfsc2zq] inductor_config[halide.scheduler_cuda]: Anderson2021",
|
| 299 |
+
"[k5ogk6345jvklsnu7g2njqstiz2g6pm5wmqpgg3kasrmuqwjvl6] inductor_config[halide.scheduler_cpu]: Adams2019",
|
| 300 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.asserts]: False",
|
| 301 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.debug]: False",
|
| 302 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.scan_kernels]: False",
|
| 303 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[external_matmul]: []",
|
| 304 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.force_extern_kernel_in_multi_template]: False",
|
| 305 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.max_mm_configs]: None",
|
| 306 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.runtime_triton_dtype_assert]: False",
|
| 307 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_name_regex]: None",
|
| 308 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_desc_regex]: None",
|
| 309 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.graphsafe_rng_func_ignores_fallback_random]: False",
|
| 310 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_pre_pass: None",
|
| 311 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_post_pass: None"
|
| 312 |
+
],
|
| 313 |
+
"key": "fr57fwh6rfk65wtgsmaeq6p7domzwaxezpig6cnku7tl6zrhoujz",
|
| 314 |
+
"time_saved_ns": 427407491
|
| 315 |
+
}
|
-_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html
ADDED
|
@@ -0,0 +1,67 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
<pre style="background-color:#ffffff;">
|
| 2 |
+
<span style="font-style:italic;color:#969896;"># AOT ID: ['0_inference']
|
| 3 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">ctypes </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">c_void_p, c_long, c_int
|
| 4 |
+
</span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">torch
|
| 5 |
+
</span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">math
|
| 6 |
+
</span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">random
|
| 7 |
+
</span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">os
|
| 8 |
+
</span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">tempfile
|
| 9 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">math </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">inf, nan
|
| 10 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">cmath </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">nanj
|
| 11 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.hooks </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">run_intermediate_hooks
|
| 12 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.utils </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">maybe_profile
|
| 13 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.codegen.memory_planning </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">_align </span><span style="font-weight:bold;color:#a71d5d;">as </span><span style="color:#323232;">align
|
| 14 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">device, empty_strided
|
| 15 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.async_compile </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">AsyncCompile
|
| 16 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.select_algorithm </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">extern_kernels
|
| 17 |
+
</span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.codegen.multi_kernel </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">MultiKernelCall
|
| 18 |
+
</span><span style="color:#323232;">
|
| 19 |
+
</span><span style="color:#323232;">aten </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.ops.aten
|
| 20 |
+
</span><span style="color:#323232;">inductor_ops </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.ops.inductor
|
| 21 |
+
</span><span style="color:#323232;">_quantized </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.ops._quantized
|
| 22 |
+
</span><span style="color:#323232;">assert_size_stride </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._dynamo.guards.assert_size_stride
|
| 23 |
+
</span><span style="color:#323232;">empty_strided_cpu </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._dynamo.guards._empty_strided_cpu
|
| 24 |
+
</span><span style="color:#323232;">empty_strided_cuda </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._dynamo.guards._empty_strided_cuda
|
| 25 |
+
</span><span style="color:#323232;">empty_strided_xpu </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._dynamo.guards._empty_strided_xpu
|
| 26 |
+
</span><span style="color:#323232;">reinterpret_tensor </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._dynamo.guards._reinterpret_tensor
|
| 27 |
+
</span><span style="color:#323232;">alloc_from_pool </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.ops.inductor._alloc_from_pool
|
| 28 |
+
</span><span style="color:#323232;">async_compile </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">AsyncCompile()
|
| 29 |
+
</span><span style="color:#323232;">empty_strided_p2p </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.</span><span style="color:#0086b3;">_C</span><span style="color:#323232;">._distributed_c10d._SymmetricMemory.empty_strided_p2p
|
| 30 |
+
</span><span style="color:#323232;">
|
| 31 |
+
</span><span style="color:#323232;">
|
| 32 |
+
</span><span style="color:#323232;">async_compile.wait(</span><span style="color:#62a35c;">globals</span><span style="color:#323232;">())
|
| 33 |
+
</span><span style="font-weight:bold;color:#a71d5d;">del </span><span style="color:#323232;">async_compile
|
| 34 |
+
</span><span style="color:#323232;">
|
| 35 |
+
</span><span style="font-weight:bold;color:#a71d5d;">def </span><span style="font-weight:bold;color:#323232;">call</span><span style="color:#323232;">(args):
|
| 36 |
+
</span><span style="color:#323232;"> arg0_1, arg1_1, arg2_1 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">args
|
| 37 |
+
</span><span style="color:#323232;"> args.clear()
|
| 38 |
+
</span><span style="color:#323232;"> assert_size_stride(arg0_1, (</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, </span><span style="color:#0086b3;">8192</span><span style="color:#323232;">), (</span><span style="color:#0086b3;">8192</span><span style="color:#323232;">, </span><span style="color:#0086b3;">1</span><span style="color:#323232;">))
|
| 39 |
+
</span><span style="color:#323232;"> assert_size_stride(arg1_1, (</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, ), (</span><span style="color:#0086b3;">1</span><span style="color:#323232;">, ))
|
| 40 |
+
</span><span style="color:#323232;"> assert_size_stride(arg2_1, (</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, ), (</span><span style="color:#0086b3;">1</span><span style="color:#323232;">, ))
|
| 41 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">with </span><span style="color:#323232;">torch.cuda._DeviceGuard(</span><span style="color:#0086b3;">0</span><span style="color:#323232;">):
|
| 42 |
+
</span><span style="color:#323232;"> torch.cuda.set_device(</span><span style="color:#0086b3;">0</span><span style="color:#323232;">)
|
| 43 |
+
</span><span style="color:#323232;"> </span><span style="font-style:italic;color:#969896;"># Topologically Sorted Source Nodes: [scaled_fake_quantize], Original ATen: [quark.scaled_fake_quantize]
|
| 44 |
+
</span><span style="color:#323232;"> buf0 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">torch.ops.quark.scaled_fake_quantize.default(</span><span style="color:#183691;">'int4'</span><span style="color:#323232;">, arg0_1, arg1_1, arg2_1, </span><span style="color:#0086b3;">0</span><span style="color:#323232;">, </span><span style="color:#0086b3;">0</span><span style="color:#323232;">, </span><span style="color:#0086b3;">0.0</span><span style="color:#323232;">, </span><span style="color:#0086b3;">15.0</span><span style="color:#323232;">, </span><span style="color:#0086b3;">0</span><span style="color:#323232;">, </span><span style="color:#183691;">'per_channel'</span><span style="color:#323232;">, </span><span style="color:#183691;">'haha'</span><span style="color:#323232;">)
|
| 45 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">del </span><span style="color:#323232;">arg0_1
|
| 46 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">del </span><span style="color:#323232;">arg1_1
|
| 47 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">del </span><span style="color:#323232;">arg2_1
|
| 48 |
+
</span><span style="color:#323232;"> buf1 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">buf0
|
| 49 |
+
</span><span style="color:#323232;"> assert_size_stride(buf1, (</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, </span><span style="color:#0086b3;">8192</span><span style="color:#323232;">), (</span><span style="color:#0086b3;">8192</span><span style="color:#323232;">, </span><span style="color:#0086b3;">1</span><span style="color:#323232;">))
|
| 50 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">del </span><span style="color:#323232;">buf0
|
| 51 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">return </span><span style="color:#323232;">(buf1, )
|
| 52 |
+
</span><span style="color:#323232;">
|
| 53 |
+
</span><span style="color:#323232;">
|
| 54 |
+
</span><span style="font-weight:bold;color:#a71d5d;">def </span><span style="font-weight:bold;color:#323232;">benchmark_compiled_module</span><span style="color:#323232;">(times</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#0086b3;">10</span><span style="color:#323232;">, repeat</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#0086b3;">10</span><span style="color:#323232;">):
|
| 55 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._dynamo.testing </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">rand_strided
|
| 56 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.utils </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">print_performance
|
| 57 |
+
</span><span style="color:#323232;"> arg0_1 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">rand_strided((</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, </span><span style="color:#0086b3;">8192</span><span style="color:#323232;">), (</span><span style="color:#0086b3;">8192</span><span style="color:#323232;">, </span><span style="color:#0086b3;">1</span><span style="color:#323232;">), device</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#183691;">'cuda:0'</span><span style="color:#323232;">, dtype</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#323232;">torch.float32)
|
| 58 |
+
</span><span style="color:#323232;"> arg1_1 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">rand_strided((</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, ), (</span><span style="color:#0086b3;">1</span><span style="color:#323232;">, ), device</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#183691;">'cuda:0'</span><span style="color:#323232;">, dtype</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#323232;">torch.float32)
|
| 59 |
+
</span><span style="color:#323232;"> arg2_1 </span><span style="font-weight:bold;color:#a71d5d;">= </span><span style="color:#323232;">rand_strided((</span><span style="color:#0086b3;">4096</span><span style="color:#323232;">, ), (</span><span style="color:#0086b3;">1</span><span style="color:#323232;">, ), device</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#183691;">'cuda:0'</span><span style="color:#323232;">, dtype</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#323232;">torch.int32)
|
| 60 |
+
</span><span style="color:#323232;"> fn </span><span style="font-weight:bold;color:#a71d5d;">= lambda</span><span style="color:#323232;">: call([arg0_1, arg1_1, arg2_1])
|
| 61 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">return </span><span style="color:#323232;">print_performance(fn, times</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#323232;">times, repeat</span><span style="font-weight:bold;color:#a71d5d;">=</span><span style="color:#323232;">repeat)
|
| 62 |
+
</span><span style="color:#323232;">
|
| 63 |
+
</span><span style="color:#323232;">
|
| 64 |
+
</span><span style="font-weight:bold;color:#a71d5d;">if </span><span style="color:#323232;">__name__ </span><span style="font-weight:bold;color:#a71d5d;">== </span><span style="color:#183691;">"__main__"</span><span style="color:#323232;">:
|
| 65 |
+
</span><span style="color:#323232;"> </span><span style="font-weight:bold;color:#a71d5d;">from </span><span style="color:#323232;">torch._inductor.wrapper_benchmark </span><span style="font-weight:bold;color:#a71d5d;">import </span><span style="color:#323232;">compiled_module_main
|
| 66 |
+
</span><span style="color:#323232;"> compiled_module_main(</span><span style="color:#183691;">'None'</span><span style="color:#323232;">, benchmark_compiled_module)
|
| 67 |
+
</span></pre>
|
-_0_0_0/inductor_pre_grad_graph_1.txt
ADDED
|
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
class GraphModule(torch.nn.Module):
|
| 2 |
+
def forward(self, L_w_: "f32[4096, 8192][8192, 1]cuda:0", L_scale_: "f32[4096][1]cuda:0", L_zero_point_: "i32[4096][1]cuda:0"):
|
| 3 |
+
l_w_ = L_w_
|
| 4 |
+
l_scale_ = L_scale_
|
| 5 |
+
l_zero_point_ = L_zero_point_
|
| 6 |
+
|
| 7 |
+
# File: /shared_volume/repos/quark/bench_qdq.py:8 in run_scaled_fake_quantize, code: return scaled_fake_quantize(quant_dtype, w, scale, zero_point, axis, group_size, quant_min, quant_max, round_mode, qscheme, mx_element_dtype)
|
| 8 |
+
function_ctx = torch.autograd.function.FunctionCtx(); function_ctx = None
|
| 9 |
+
|
| 10 |
+
# File: /shared_volume/repos/quark/quark/torch/kernel/__init__.py:168 in forward, code: return ops.quark.scaled_fake_quantize(quant_dtype, inputs, scale, zero_point, axis, group_size, quant_min,
|
| 11 |
+
scaled_fake_quantize: "f32[4096, 8192][8192, 1]cuda:0" = torch.ops.quark.scaled_fake_quantize('int4', l_w_, l_scale_, l_zero_point_, 0, 0, 0, 15, 0, 'per_channel', 'haha'); l_w_ = l_scale_ = l_zero_point_ = None
|
| 12 |
+
return (scaled_fake_quantize,)
|
| 13 |
+
|
| 14 |
+
|
| 15 |
+
# graph id: 140371115438448
|
-_0_0_0/torch._functorch.config_6.txt
ADDED
|
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"TYPE_CHECKING": false,
|
| 3 |
+
"functionalize_rng_ops": false,
|
| 4 |
+
"fake_tensor_allow_meta": true,
|
| 5 |
+
"debug_assert": false,
|
| 6 |
+
"debug_partitioner": false,
|
| 7 |
+
"decompose_custom_triton_ops": true,
|
| 8 |
+
"static_weight_shapes": true,
|
| 9 |
+
"cse": true,
|
| 10 |
+
"enable_autograd_cache": true,
|
| 11 |
+
"enable_remote_autograd_cache": null,
|
| 12 |
+
"view_replay_for_aliased_outputs": true,
|
| 13 |
+
"max_dist_from_bw": 1000,
|
| 14 |
+
"ban_recompute_used_far_apart": true,
|
| 15 |
+
"ban_recompute_long_fusible_chains": true,
|
| 16 |
+
"ban_recompute_materialized_backward": true,
|
| 17 |
+
"ban_recompute_not_in_allowlist": true,
|
| 18 |
+
"ban_recompute_reductions": true,
|
| 19 |
+
"recompute_views": false,
|
| 20 |
+
"activation_memory_budget": 1.0,
|
| 21 |
+
"activation_memory_budget_runtime_estimator": "flops",
|
| 22 |
+
"activation_memory_budget_solver": "dp",
|
| 23 |
+
"visualize_memory_budget_pareto": false,
|
| 24 |
+
"memory_budget_pareto_dir": null,
|
| 25 |
+
"aggressive_recomputation": false,
|
| 26 |
+
"fake_tensor_allow_unsafe_data_ptr_access": true,
|
| 27 |
+
"unlift_effect_tokens": true,
|
| 28 |
+
"fake_tensor_crossref": false,
|
| 29 |
+
"fake_tensor_propagate_real_tensors": false,
|
| 30 |
+
"donated_buffer": true,
|
| 31 |
+
"torch_compile_graph_format": "svg",
|
| 32 |
+
"generate_fake_kernels_from_real_mismatches": false,
|
| 33 |
+
"graphsafe_rng_functionalization": true,
|
| 34 |
+
"strict_autograd_cache": false,
|
| 35 |
+
"disable_guess_zero_tangent_for_mutated_input_subclass": false
|
| 36 |
+
}
|
chromium_events.json
ADDED
|
@@ -0,0 +1,962 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
[
|
| 2 |
+
{
|
| 3 |
+
"args": {
|
| 4 |
+
"compile_id": "0/0"
|
| 5 |
+
},
|
| 6 |
+
"cat": "dynamo_timed",
|
| 7 |
+
"name": "dynamo",
|
| 8 |
+
"ph": "B",
|
| 9 |
+
"pid": 0,
|
| 10 |
+
"tid": 0,
|
| 11 |
+
"ts": 1750251841454820.0
|
| 12 |
+
},
|
| 13 |
+
{
|
| 14 |
+
"args": {
|
| 15 |
+
"compile_id": "0/0",
|
| 16 |
+
"fn_name": "_compile.compile_inner"
|
| 17 |
+
},
|
| 18 |
+
"cat": "dynamo_timed",
|
| 19 |
+
"name": "entire_frame_compile",
|
| 20 |
+
"ph": "B",
|
| 21 |
+
"pid": 0,
|
| 22 |
+
"tid": 0,
|
| 23 |
+
"ts": 1750251841482125.8
|
| 24 |
+
},
|
| 25 |
+
{
|
| 26 |
+
"args": {
|
| 27 |
+
"compile_id": "0/0",
|
| 28 |
+
"fn_name": "OutputGraph.call_user_compiler"
|
| 29 |
+
},
|
| 30 |
+
"cat": "dynamo_timed",
|
| 31 |
+
"name": "backend_compile",
|
| 32 |
+
"ph": "B",
|
| 33 |
+
"pid": 0,
|
| 34 |
+
"tid": 0,
|
| 35 |
+
"ts": 1750251841551173.2
|
| 36 |
+
},
|
| 37 |
+
{
|
| 38 |
+
"args": {
|
| 39 |
+
"compile_id": "0/0"
|
| 40 |
+
},
|
| 41 |
+
"cat": "dynamo_timed",
|
| 42 |
+
"name": "_recursive_pre_grad_passes",
|
| 43 |
+
"ph": "B",
|
| 44 |
+
"pid": 0,
|
| 45 |
+
"tid": 0,
|
| 46 |
+
"ts": 1750251841778018.5
|
| 47 |
+
},
|
| 48 |
+
{
|
| 49 |
+
"args": {
|
| 50 |
+
"compile_id": "0/0"
|
| 51 |
+
},
|
| 52 |
+
"cat": "dynamo_timed",
|
| 53 |
+
"name": "_recursive_pre_grad_passes",
|
| 54 |
+
"ph": "E",
|
| 55 |
+
"pid": 0,
|
| 56 |
+
"tid": 0,
|
| 57 |
+
"ts": 1750251841791426.5
|
| 58 |
+
},
|
| 59 |
+
{
|
| 60 |
+
"args": {
|
| 61 |
+
"compile_id": "0/0"
|
| 62 |
+
},
|
| 63 |
+
"cat": "dynamo_timed",
|
| 64 |
+
"name": "create_aot_dispatcher_function",
|
| 65 |
+
"ph": "B",
|
| 66 |
+
"pid": 0,
|
| 67 |
+
"tid": 0,
|
| 68 |
+
"ts": 1750251841793402.5
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"args": {
|
| 72 |
+
"compile_id": "0/0"
|
| 73 |
+
},
|
| 74 |
+
"cat": "dynamo_timed",
|
| 75 |
+
"name": "compile_fx.<locals>.fw_compiler_base",
|
| 76 |
+
"ph": "B",
|
| 77 |
+
"pid": 0,
|
| 78 |
+
"tid": 0,
|
| 79 |
+
"ts": 1750251841814442.2
|
| 80 |
+
},
|
| 81 |
+
{
|
| 82 |
+
"args": {
|
| 83 |
+
"compile_id": "0/0"
|
| 84 |
+
},
|
| 85 |
+
"cat": "dynamo_timed",
|
| 86 |
+
"name": "_recursive_joint_graph_passes",
|
| 87 |
+
"ph": "B",
|
| 88 |
+
"pid": 0,
|
| 89 |
+
"tid": 0,
|
| 90 |
+
"ts": 1750251841815353.0
|
| 91 |
+
},
|
| 92 |
+
{
|
| 93 |
+
"args": {
|
| 94 |
+
"compile_id": "0/0"
|
| 95 |
+
},
|
| 96 |
+
"cat": "dynamo_timed",
|
| 97 |
+
"name": "_recursive_joint_graph_passes",
|
| 98 |
+
"ph": "E",
|
| 99 |
+
"pid": 0,
|
| 100 |
+
"tid": 0,
|
| 101 |
+
"ts": 1750251842111758.2
|
| 102 |
+
},
|
| 103 |
+
{
|
| 104 |
+
"args": {
|
| 105 |
+
"compile_id": "0/0",
|
| 106 |
+
"fn_name": "compile_fx_inner"
|
| 107 |
+
},
|
| 108 |
+
"cat": "dynamo_timed",
|
| 109 |
+
"name": "inductor_compile",
|
| 110 |
+
"ph": "B",
|
| 111 |
+
"pid": 0,
|
| 112 |
+
"tid": 0,
|
| 113 |
+
"ts": 1750251842112457.0
|
| 114 |
+
},
|
| 115 |
+
{
|
| 116 |
+
"args": {
|
| 117 |
+
"compile_id": "0/0"
|
| 118 |
+
},
|
| 119 |
+
"cat": "dynamo_timed",
|
| 120 |
+
"name": "inductor_codecache_torch_key",
|
| 121 |
+
"ph": "B",
|
| 122 |
+
"pid": 0,
|
| 123 |
+
"tid": 0,
|
| 124 |
+
"ts": 1750251842118406.0
|
| 125 |
+
},
|
| 126 |
+
{
|
| 127 |
+
"args": {
|
| 128 |
+
"compile_id": "0/0"
|
| 129 |
+
},
|
| 130 |
+
"cat": "dynamo_timed",
|
| 131 |
+
"name": "inductor_codecache_torch_key",
|
| 132 |
+
"ph": "E",
|
| 133 |
+
"pid": 0,
|
| 134 |
+
"tid": 0,
|
| 135 |
+
"ts": 1750251842234516.2
|
| 136 |
+
},
|
| 137 |
+
{
|
| 138 |
+
"args": {
|
| 139 |
+
"compile_id": "0/0"
|
| 140 |
+
},
|
| 141 |
+
"cat": "dynamo_timed",
|
| 142 |
+
"name": "PyCodeCache.load_by_key_path",
|
| 143 |
+
"ph": "B",
|
| 144 |
+
"pid": 0,
|
| 145 |
+
"tid": 0,
|
| 146 |
+
"ts": 1750251842504139.8
|
| 147 |
+
},
|
| 148 |
+
{
|
| 149 |
+
"args": {
|
| 150 |
+
"compile_id": "0/0"
|
| 151 |
+
},
|
| 152 |
+
"cat": "dynamo_timed",
|
| 153 |
+
"name": "async_compile.wait",
|
| 154 |
+
"ph": "B",
|
| 155 |
+
"pid": 0,
|
| 156 |
+
"tid": 0,
|
| 157 |
+
"ts": 1750251842508906.2
|
| 158 |
+
},
|
| 159 |
+
{
|
| 160 |
+
"args": {
|
| 161 |
+
"compile_id": "0/0"
|
| 162 |
+
},
|
| 163 |
+
"cat": "dynamo_timed",
|
| 164 |
+
"name": "async_compile.wait",
|
| 165 |
+
"ph": "E",
|
| 166 |
+
"pid": 0,
|
| 167 |
+
"tid": 0,
|
| 168 |
+
"ts": 1750251842509594.5
|
| 169 |
+
},
|
| 170 |
+
{
|
| 171 |
+
"args": {
|
| 172 |
+
"compile_id": "0/0"
|
| 173 |
+
},
|
| 174 |
+
"cat": "dynamo_timed",
|
| 175 |
+
"name": "PyCodeCache.load_by_key_path",
|
| 176 |
+
"ph": "E",
|
| 177 |
+
"pid": 0,
|
| 178 |
+
"tid": 0,
|
| 179 |
+
"ts": 1750251842509931.5
|
| 180 |
+
},
|
| 181 |
+
{
|
| 182 |
+
"args": {
|
| 183 |
+
"cache_event_time": 1750251842521445359,
|
| 184 |
+
"cache_state": "hit",
|
| 185 |
+
"compile_id": "0/0",
|
| 186 |
+
"components": [
|
| 187 |
+
"[b6z7ijvsnbtjurvqwdotlb6qtuyjsz4krtpkqj5thbq3fhqsbhp] gm: <lambda>()\n\n\n\ndef forward(self, arg0_1, arg1_1, arg2_1):\n scaled_fake_quantize = torch.ops.quark.scaled_fake_quantize.default('int4', arg0_1, arg1_1, arg2_1, 0, 0, 0.0, 15.0, 0, 'per_channel', 'haha'); arg0_1 = arg1_1 = arg2_1 = None\n return (scaled_fake_quantize,)\n \n# To see more debug info, please use `graph_module.print_readable()`",
|
| 188 |
+
"[nef3d47wx7hdxcyvwgucihijvag3qlbodqmms7dktjkxqgk4gux] example_inputs[0]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096, 8192]), stride=(8192, 1), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 189 |
+
"[7eps4cy57l62xkqx7rnf6ttfsuweegaqsqravzj2x5h4v6fbtod] example_inputs[1]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 190 |
+
"[dpovg5nw4n7fkaetfrkwcqepypqcssr7fzpd75svn53n4xjxfow] example_inputs[2]: TensorMetadata(dtype=torch.int32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 191 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] cache_key_tag: ",
|
| 192 |
+
"[lmglpn4zi7vob56n34r2j2rk7flv5xfgrcvmo7xcpirqsitygqx] fx_kwargs[boxed_forward_device_index]: BoxedDeviceIndex(value=None)",
|
| 193 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[cpp_wrapper]: False",
|
| 194 |
+
"[xq2hdkbfkbcuye6rgtypayrkhqf4cntij2dsd24rei3lsknakkf] fx_kwargs[cudagraphs]: BoxedBool(value=False)",
|
| 195 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[extern_node_serializer]: None",
|
| 196 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[is_backward]: False",
|
| 197 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] fx_kwargs[is_inference]: True",
|
| 198 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[layout_opt]: None",
|
| 199 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] fx_kwargs[static_input_idxs]: []",
|
| 200 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inputs_to_check[0]: 0",
|
| 201 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inputs_to_check[1]: 1",
|
| 202 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inputs_to_check[2]: 2",
|
| 203 |
+
"[du4vyrfyozrfxcf6kk6ma7oqwatapifazeelfsawmsiu6gjdtxp] deterministic_algorithms_settings: (False, False, True)",
|
| 204 |
+
"[qiptf2633zubseuei4bkisoq3not35l6lud6p23p4qmcsxiw2uq] cuda_matmul_settings: (False, True, True)",
|
| 205 |
+
"[ol6sj5vrtmgqd5cnfjbun7wbukfn7jyrtpkapnhmsysjdypit4i] torch_version: <bytes>",
|
| 206 |
+
"[rlwghyno43ot2zz35l3xlcrrh3arqenri6t5nsopt3t3q333zgy] system_info[device]: {'name': 'gfx942:sramecc+:xnack-'}",
|
| 207 |
+
"[njkbnmcun3rnt2yz2lgf57oprgdbjzlkadbcfoy57sir5fnskzg] system_info[version]: {'triton': '3.3.02e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-364a7d1dd5f29867a741138f83c5b453259e240a5d51f364f24f7196cedbf442-2e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-23d635e690d670bf61798e1259674b78c0ed5ba222ab6a455f329f27a758fc2d-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-ca6686d24a6f780b8449b43d419d11c978ebd00ab87a5fc6e57198a2027680d0-00deb4ba92653e089ad09c2f67cbc85602c84cd3ee2347ddcfcccc2081cfa45e-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-78995dd40c4e54964f62cdc6d47e66f6d9df8b55b172ad7eb99235f27999c840-f7c26e8ffdaf8cd2491de04217d32827b1a4f859f7f93ea56e26590c9f5e071a-a5b982237b29a230519ad566660a5912ae9d31da0dd6388465f3a1043b12ece7-6e4a7df0c1f6cb799f488ee1d6efd3df754fc18aac6e7209923bb022c36c7c4e-f983f9d6d6f987af520297c8fe3185601ae8f7d60bacab880ac9326bdfee1f67-5d15c5bebef8d7aa51b21fd187e5faa95eba4a213254355bc69e0648013599f7-26a8aeaf21e759191f173b578316e243ad970387442a1b238481c6a1b2eecdc4-bd364752852b76a0b75a9d93ecbc239781b730aa75021445a02d795aa8d38f6a-72bc1771d8b160fbafcd5390d1ee6cb72440c10ad4834451465a9e93b42f5d1c-7b506c955ee5646862dae548968e6523d75c37ad4750c214d9ab0f6918ecc88a-89e4844782de5fdff4868ac2846514570a6e280a6b92e91af2e180904043c833-115ada51f797cd098ddc5e4b95e8369a885571b15639694b6801f59e46eab55e-0e48b5e1e95136642ccfe62dc3d0a739a2c20a7b5ee13e9c23c6cecd68cdeb70-b616015f724e553348f5b019f7324dec130f7bbaf984d43300fa69c7c2fdda2f-54fe722cbe379a55695ab9478e73d344377cf5e9d6e055aff7cd03bf6fff1b2a-10285555cd515e21ca54714fc8eb9c173cca6b092b5e951a17ae5eee28ed2707-f2d4e73182e68eddc6237577b2158b7d8498ccb3c50642b9c74c55d3f4be3943', 'hip': '6.3.42131-fa1d09cbd'}",
|
| 208 |
+
"[3qefpuc3yyxaxf25vrqt6skezzayzydwq2o6i2xf2qdyioam5zw] system_info[hash]: 6e7af1eb52fca9b11dcfccdeb7b2a74263a0c6d2c07fe2b7f2c2003a4663609b",
|
| 209 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[TYPE_CHECKING]: False",
|
| 210 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_padding]: True",
|
| 211 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[can_inplace_pad_graph_input]: False",
|
| 212 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[enable_auto_functionalized_v2]: True",
|
| 213 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug]: False",
|
| 214 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_progress]: True",
|
| 215 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[verbose_progress]: False",
|
| 216 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[fx_graph_cache]: True",
|
| 217 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[fx_graph_remote_cache]: None",
|
| 218 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bundle_triton_into_fx_graph_cache]: True",
|
| 219 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_local_cache]: True",
|
| 220 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[autotune_remote_cache]: None",
|
| 221 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[bundled_autotune_remote_cache]: None",
|
| 222 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_disable_caches]: False",
|
| 223 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[sleep_sec_TESTING_ONLY]: None",
|
| 224 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[custom_op_default_layout_constraint]: needs_fixed_stride_order",
|
| 225 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[triton_kernel_default_layout_constraint]: needs_fixed_stride_order",
|
| 226 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp_wrapper]: False",
|
| 227 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[online_softmax]: True",
|
| 228 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[dce]: False",
|
| 229 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[static_weight_shapes]: True",
|
| 230 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[size_asserts]: True",
|
| 231 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[nan_asserts]: False",
|
| 232 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[scalar_asserts]: True",
|
| 233 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pick_loop_orders]: True",
|
| 234 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_buffers]: True",
|
| 235 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[allow_buffer_reuse]: True",
|
| 236 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[memory_planning]: False",
|
| 237 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[use_fast_math]: False",
|
| 238 |
+
"[x75won4jmsgeb63pcvwr2y4eteyzzdhmf5rv6xhjppie4hx2yu5] inductor_config[memory_pool]: intermediates",
|
| 239 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_harness]: True",
|
| 240 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[epilogue_fusion]: True",
|
| 241 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[prologue_fusion]: True",
|
| 242 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[epilogue_fusion_first]: False",
|
| 243 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pattern_matcher]: True",
|
| 244 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[b2b_gemm_pass]: False",
|
| 245 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_pre_pass]: None",
|
| 246 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_post_pass]: None",
|
| 247 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[pre_grad_custom_pass]: None",
|
| 248 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_cat_fx_passes]: True",
|
| 249 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[efficient_conv_bn_eval_fx_passes]: False",
|
| 250 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_predispatch]: False",
|
| 251 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[group_fusion]: False",
|
| 252 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[batch_fusion]: True",
|
| 253 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[pre_grad_fusion_options]: {}",
|
| 254 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[post_grad_fusion_options]: {}",
|
| 255 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_locality]: True",
|
| 256 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[dynamic_scale_rblock]: True",
|
| 257 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_fuse_int_mm_with_mul]: False",
|
| 258 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_mixed_mm]: True",
|
| 259 |
+
"[zwmmbkdkarexuhbigurz5lfnhx64tht7fznecjkrvznh6rzivbv] inductor_config[fx_passes_numeric_check]: {'pre_grad': False, 'precision': 0.0001, 'num_iterations': 1, 'requires_optimizer': True}",
|
| 260 |
+
"[v2td5s4lnsvyxvaevy4chx6kc5h3mm2axazbgwimqule5zrzao7] inductor_config[mixed_mm_choice]: heuristic",
|
| 261 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[reorder_for_compute_comm_overlap]: False",
|
| 262 |
+
"[ssupi7bu3rrhdpg2jyegzncu3kg3nnhklyliqvutaxgs7y7k3dx] inductor_config[reorder_for_compute_comm_overlap_passes]: ['reorder_compute_for_overlap', 'sink_waits', 'raise_comms']",
|
| 263 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_peak_memory]: True",
|
| 264 |
+
"[lxxtoqhcoepwfokeiibd575gnxo3uzwiv4hmpomlwkpzqz3qzsh] inductor_config[estimate_op_runtime]: default",
|
| 265 |
+
"[yezuzjtg4h3jjur4jwtwiehbyixa7eonq4tqsqmwqve2lvvmrem] inductor_config[intra_node_bw]: 300",
|
| 266 |
+
"[5fxczt3ciyxitdhizb7sfsgn7fhpczcqsngttnt5ot2wyctk7co] inductor_config[inter_node_bw]: 25",
|
| 267 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_experimental_benchmarker]: True",
|
| 268 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[max_autotune]: True",
|
| 269 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_pointwise]: False",
|
| 270 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_gemm]: False",
|
| 271 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[autotune_num_choices_displayed]: 10",
|
| 272 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[graph_partition]: False",
|
| 273 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_same_precision]: False",
|
| 274 |
+
"[2y7luesktjrque3nr7qtxnum2mkbeegzdrsvkm3rvdlhqboajhx] inductor_config[max_autotune_gemm_backends]: ATEN,TRITON,CPP",
|
| 275 |
+
"[uqlsbif4zxd75vt522p52txyuguieipi2lwz5g5awt56lccqk7s] inductor_config[max_autotune_conv_backends]: ATEN,TRITON",
|
| 276 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[max_autotune_gemm_search_space]: DEFAULT",
|
| 277 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_fallback_to_aten]: True",
|
| 278 |
+
"[wft6ljqsfr3x4m7fa5zuyb7cwknky4irrxz4bjr6uzr2yiopxqj] inductor_config[unbacked_symint_fallback]: 8192",
|
| 279 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[search_autotune_cache]: False",
|
| 280 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[save_args]: False",
|
| 281 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_in_subproc]: False",
|
| 282 |
+
"[iglov24t7x5ruci344aer2tm6nqshi4veuw4wxlssxtu46cx76m] inductor_config[max_autotune_subproc_result_timeout_seconds]: 60.0",
|
| 283 |
+
"[bh33ranllcgilhgmgr3qvygzxjm6isq5iexnfm3zx6fnr2zwlp2] inductor_config[max_autotune_subproc_graceful_timeout_seconds]: 1.0",
|
| 284 |
+
"[pwoh5aypf4fxbntdvwt67rppxorqos6xr3w7qzeun6kblbfg2ga] inductor_config[max_autotune_subproc_terminate_timeout_seconds]: 2.0",
|
| 285 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_multi_device]: False",
|
| 286 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[coordinate_descent_tuning]: True",
|
| 287 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[coordinate_descent_check_all_directions]: False",
|
| 288 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[coordinate_descent_search_radius]: 1",
|
| 289 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[autoheuristic_collect]: ",
|
| 290 |
+
"[jwbrgxes7vjqumngs5hyj6gn5nytv2whnppnzngvaagfmawhkkd] inductor_config[autoheuristic_use]: mixed_mm",
|
| 291 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[autoheuristic_log_path]: DEFAULT",
|
| 292 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[layout_opt_default]: 0",
|
| 293 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[layout_optimization]: False",
|
| 294 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_layout_optimization]: False",
|
| 295 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[keep_output_stride]: True",
|
| 296 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[warn_mix_layout]: False",
|
| 297 |
+
"[lkkae3meylaixfif4thncru4hjqeaislawjoghffrbwuscaagei] inductor_config[realize_reads_threshold]: 4",
|
| 298 |
+
"[rr5m5hsocoyodldz7vcvaizdwvm2rt34evmqdxvng7wz3tufvo6] inductor_config[realize_opcount_threshold]: 30",
|
| 299 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[realize_acc_reads_threshold]: 8",
|
| 300 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[fallback_random]: False",
|
| 301 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[implicit_fallbacks]: True",
|
| 302 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aggressive_fusion]: False",
|
| 303 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_fusion]: False",
|
| 304 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_fusion]: False",
|
| 305 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[enabled_metric_tables]: ",
|
| 306 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[loop_ordering_after_fusion]: False",
|
| 307 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[score_fusion_memory_threshold]: 10",
|
| 308 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_epilogue_fusion]: True",
|
| 309 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[max_epilogue_benchmarked_choices]: 1",
|
| 310 |
+
"[jykiys6ynafs3zdylwa5ggq6j655mxeh42d6mtdi22gffkrmiac] inductor_config[max_fusion_size]: 64",
|
| 311 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[max_pointwise_cat_inputs]: 8",
|
| 312 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_pointwise_cat]: False",
|
| 313 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[unroll_reductions_threshold]: 8",
|
| 314 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[comment_origin]: False",
|
| 315 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[conv_1x1_as_mm]: False",
|
| 316 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_reductions]: True",
|
| 317 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_kernel]: False",
|
| 318 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[constant_and_index_propagation]: True",
|
| 319 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[always_keep_tensor_constants]: False",
|
| 320 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[assert_indirect_indexing]: True",
|
| 321 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[compute_all_bounds]: False",
|
| 322 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernels]: False",
|
| 323 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_combo_kernel]: False",
|
| 324 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernels_autotune]: 1",
|
| 325 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernel_allow_mixed_sizes]: 1",
|
| 326 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernel_foreach_dynamic_shapes]: False",
|
| 327 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[joint_graph_constant_folding]: True",
|
| 328 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_index_asserts]: False",
|
| 329 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[emulate_precision_casts]: False",
|
| 330 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_nightly_or_source]: False",
|
| 331 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[developer_warnings]: False",
|
| 332 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[optimize_scatter_upon_const_tensor]: True",
|
| 333 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[add_pre_grad_passes]: None",
|
| 334 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[remove_pre_grad_passes]: None",
|
| 335 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[global_cache_dir]: None",
|
| 336 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[kernel_name_max_ops]: 10",
|
| 337 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[shape_padding]: True",
|
| 338 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[comprehensive_padding]: True",
|
| 339 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_channels_last]: False",
|
| 340 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_padding_cpu]: True",
|
| 341 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[padding_alignment_bytes]: 128",
|
| 342 |
+
"[dnnw5ks3yxrp7mwvihb2hh4tqx35ye637xt33x64kw4fvz2nyzg] inductor_config[padding_stride_threshold]: 1024",
|
| 343 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_outputs]: False",
|
| 344 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bw_outputs_user_visible]: True",
|
| 345 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_shape_pad]: False",
|
| 346 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[permute_fusion]: False",
|
| 347 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profiler_mark_wrapper_call]: False",
|
| 348 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[generate_intermediate_hooks]: False",
|
| 349 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_ir_traceback]: False",
|
| 350 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth]: False",
|
| 351 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[profile_bandwidth_regex]: ",
|
| 352 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[profile_bandwidth_output]: None",
|
| 353 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth_with_do_bench_using_profiling]: False",
|
| 354 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[disable_cpp_codegen]: False",
|
| 355 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing]: False",
|
| 356 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing_discard_parameters]: False",
|
| 357 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[decompose_mem_bound_mm]: False",
|
| 358 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[assume_aligned_inputs]: False",
|
| 359 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[unsafe_ignore_unsupported_triton_autotune_args]: False",
|
| 360 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[check_stack_no_cycles_TESTING_ONLY]: False",
|
| 361 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[enable_linear_binary_folding]: False",
|
| 362 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[annotate_training]: False",
|
| 363 |
+
"[sz3im5ogc6asp7g4uqocnovype63tkdexzfrniv6hn2oank3biu] inductor_config[cpp.threads]: -1",
|
| 364 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.no_redundant_loops]: True",
|
| 365 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.dynamic_threads]: False",
|
| 366 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.simdlen]: None",
|
| 367 |
+
"[g7rrnbg5yonzux3cfj5ovre5lob3ayda7qcfpxjvtwmiz4uicii] inductor_config[cpp.min_chunk_size]: 4096",
|
| 368 |
+
"[c7zj4qytmety6keurs3hsh5wn7foxp3dqx4kym2ucszzcb2ngrf] inductor_config[cpp.cxx]: (None, 'g++')",
|
| 369 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_kernel_profile]: False",
|
| 370 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.weight_prepack]: True",
|
| 371 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_relu_bug_TESTING_ONLY]: None",
|
| 372 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_log1p_bug_TESTING_ONLY]: None",
|
| 373 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.vec_isa_ok]: None",
|
| 374 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[cpp.descriptive_names]: original_aten",
|
| 375 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[cpp.max_horizontal_fusion_size]: 16",
|
| 376 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.fallback_scatter_reduce_sum]: True",
|
| 377 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_unsafe_math_opt_flag]: False",
|
| 378 |
+
"[ijs44lspkinjvhcs7uff7n3noc53jvsp4yfljjh22mafhb7khxe] inductor_config[cpp.enable_floating_point_contract_flag]: off",
|
| 379 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_tiling_heuristics]: True",
|
| 380 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_grouped_gemm_template]: False",
|
| 381 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cpp.gemm_max_k_slices]: 1",
|
| 382 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_cache_blocking]: None",
|
| 383 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_thread_factors]: None",
|
| 384 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_loop_tail_vec]: True",
|
| 385 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_concat_linear]: False",
|
| 386 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraphs]: False",
|
| 387 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_trees]: True",
|
| 388 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_skip_dynamic_graphs]: False",
|
| 389 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.slow_path_cudagraph_asserts]: True",
|
| 390 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_trees_history_recording]: False",
|
| 391 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_support_input_mutation]: True",
|
| 392 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[triton.cudagraph_unexpected_rerecord_limit]: 128",
|
| 393 |
+
"[tuax46wac7rfv2trf5gcps6vleo3cq44lbnrdxtprvo3ljjaddj] inductor_config[triton.cudagraph_dynamic_shape_warn_limit]: 50",
|
| 394 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraph_sync]: False",
|
| 395 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraphs_warmup]: False",
|
| 396 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.fast_path_cudagraph_asserts]: False",
|
| 397 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_cudagraph_warmup]: False",
|
| 398 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_graph]: False",
|
| 399 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_kernel]: False",
|
| 400 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.dense_indexing]: False",
|
| 401 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[triton.max_tiles]: 2",
|
| 402 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.prefer_nd_tiling]: False",
|
| 403 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_pointwise]: True",
|
| 404 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_cublasLt]: True",
|
| 405 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.autotune_at_compile_time]: None",
|
| 406 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.tile_reductions]: False",
|
| 407 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_pointwise_fusion]: True",
|
| 408 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_reduction_fusion]: True",
|
| 409 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.unique_kernel_names]: True",
|
| 410 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.unique_user_kernel_names]: False",
|
| 411 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[triton.descriptive_names]: original_aten",
|
| 412 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.persistent_reductions]: True",
|
| 413 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cooperative_reductions]: False",
|
| 414 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cooperative_reductions]: False",
|
| 415 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inductor_config[triton.multi_kernel]: 0",
|
| 416 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.divisible_by_16]: True",
|
| 417 |
+
"[fv6slhtedtydps5s5u2etitscliblzcidyitqf7krsv4e23fzk6] inductor_config[triton.min_split_scan_rblock]: 256",
|
| 418 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.store_cubin]: False",
|
| 419 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[triton.spill_threshold]: 16",
|
| 420 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.use_block_ptr]: False",
|
| 421 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.inject_relu_bug_TESTING_ONLY]: None",
|
| 422 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.codegen_upcast_to_fp32]: True",
|
| 423 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.enable_persistent_tma_matmul]: False",
|
| 424 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_l1_cache]: False",
|
| 425 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.disallow_failing_autotune_kernels_TESTING_ONLY]: False",
|
| 426 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.output_path]: ",
|
| 427 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.debug_compile]: False",
|
| 428 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.compile_wrapper_with_O0]: False",
|
| 429 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[aot_inductor.debug_intermediate_value_printer]: 0",
|
| 430 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[aot_inductor.filtered_kernel_names]: None",
|
| 431 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_in_spec]: ",
|
| 432 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_out_spec]: ",
|
| 433 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_runtime_constant_folding]: False",
|
| 434 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.force_mmap_weights]: False",
|
| 435 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package]: False",
|
| 436 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package_cpp_only]: False",
|
| 437 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.metadata]: {}",
|
| 438 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.raise_error_on_ignored_optimization]: True",
|
| 439 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.dump_aoti_minifier]: False",
|
| 440 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[aot_inductor.repro_level]: 2",
|
| 441 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.presets]: {}",
|
| 442 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.allow_stack_allocation]: False",
|
| 443 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_minimal_arrayref_interface]: False",
|
| 444 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.package_constants_in_so]: True",
|
| 445 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.arch]: None",
|
| 446 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.version]: None",
|
| 447 |
+
"[tvyftmtdmezlejo2xllu7awzv4pzc4vm4fub4b3gpl5jptjkosi] inductor_config[cuda.compile_opt_level]: -O1",
|
| 448 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_cuda_lto]: False",
|
| 449 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_ptxas_info]: False",
|
| 450 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_debug_info]: False",
|
| 451 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.use_fast_math]: False",
|
| 452 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_max_profiling_configs]: None",
|
| 453 |
+
"[xaicuyqjstadzph6cgvxowlzizkts6kzmfupsnbyaorxh37cppz] inductor_config[cuda.cutlass_max_profiling_swizzle_options]: [1, 2, 4]",
|
| 454 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cuda_cxx]: None",
|
| 455 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cuda.cutlass_backend_min_gemm_size]: 1",
|
| 456 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.generate_test_runner]: False",
|
| 457 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_allowlist_regex]: None",
|
| 458 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_denylist_regex]: None",
|
| 459 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[cuda.cutlass_instantiation_level]: 0",
|
| 460 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[rocm.arch]: []",
|
| 461 |
+
"[3w3j4h2iiu3addwyb5alaeecz3so7teb23hp4d5n3b46w5n73ur] inductor_config[rocm.ck_supported_arch]: ['gfx90a', 'gfx942']",
|
| 462 |
+
"[klfqjprnpfhcdurgvuikvc4rpd5ynkpk77toousr5h3u5roty6p] inductor_config[rocm.compile_opt_level]: -O2",
|
| 463 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.is_debug]: False",
|
| 464 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.save_temps]: False",
|
| 465 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.use_fast_math]: True",
|
| 466 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.flush_denormals]: True",
|
| 467 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.print_kernel_resource_usage]: False",
|
| 468 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.rocm_home]: None",
|
| 469 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.ck_dir]: None",
|
| 470 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.generate_test_runner]: False",
|
| 471 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.n_max_profiling_configs]: None",
|
| 472 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.use_preselected_instances]: False",
|
| 473 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.kBatch_sweep]: None",
|
| 474 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[rocm.split_k_threshold]: 16",
|
| 475 |
+
"[bsvfcwwoczx2rlkdz2eta6doujsymyihmi46hhwk6clrrvwcb6m] inductor_config[cpu_backend]: cpp",
|
| 476 |
+
"[caw4ly2z672k6kjfahoxwpajp5idhhtrpgf3ma2clylcp7c7aid] inductor_config[cuda_backend]: triton",
|
| 477 |
+
"[ljhgflgihidopsfsdcbqynv27nceykby3nutyd5jlcpq7n6e7l4] inductor_config[halide.cpu_target]: host",
|
| 478 |
+
"[wx7vmsmrdpk5ue2txlywp3lj3faqmdjphs5fgg2ehzsyno7uovg] inductor_config[halide.gpu_target]: host-cuda",
|
| 479 |
+
"[svgytlua5wcyeia7wq7e6zgh5tsueikrnzchmdmouvmkpfsc2zq] inductor_config[halide.scheduler_cuda]: Anderson2021",
|
| 480 |
+
"[k5ogk6345jvklsnu7g2njqstiz2g6pm5wmqpgg3kasrmuqwjvl6] inductor_config[halide.scheduler_cpu]: Adams2019",
|
| 481 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.asserts]: False",
|
| 482 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.debug]: False",
|
| 483 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.scan_kernels]: False",
|
| 484 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[external_matmul]: []",
|
| 485 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.force_extern_kernel_in_multi_template]: False",
|
| 486 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.max_mm_configs]: None",
|
| 487 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.runtime_triton_dtype_assert]: False",
|
| 488 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_name_regex]: None",
|
| 489 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_desc_regex]: None",
|
| 490 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.graphsafe_rng_func_ignores_fallback_random]: False",
|
| 491 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_pre_pass: None",
|
| 492 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_post_pass: None"
|
| 493 |
+
],
|
| 494 |
+
"key": "fr57fwh6rfk65wtgsmaeq6p7domzwaxezpig6cnku7tl6zrhoujz",
|
| 495 |
+
"time_saved_ns": 427407491
|
| 496 |
+
},
|
| 497 |
+
"cat": "dynamo_timed",
|
| 498 |
+
"name": "fx_graph_cache_hit",
|
| 499 |
+
"ph": "i",
|
| 500 |
+
"pid": 0,
|
| 501 |
+
"s": "p",
|
| 502 |
+
"tid": 0,
|
| 503 |
+
"ts": 1750251842118276.5
|
| 504 |
+
},
|
| 505 |
+
{
|
| 506 |
+
"args": {
|
| 507 |
+
"cache_bypass_reason": null,
|
| 508 |
+
"cache_event_time": 1750251842118276381,
|
| 509 |
+
"cache_state": "hit",
|
| 510 |
+
"compile_id": "0/0",
|
| 511 |
+
"components": [
|
| 512 |
+
"[b6z7ijvsnbtjurvqwdotlb6qtuyjsz4krtpkqj5thbq3fhqsbhp] gm: <lambda>()\n\n\n\ndef forward(self, arg0_1, arg1_1, arg2_1):\n scaled_fake_quantize = torch.ops.quark.scaled_fake_quantize.default('int4', arg0_1, arg1_1, arg2_1, 0, 0, 0.0, 15.0, 0, 'per_channel', 'haha'); arg0_1 = arg1_1 = arg2_1 = None\n return (scaled_fake_quantize,)\n \n# To see more debug info, please use `graph_module.print_readable()`",
|
| 513 |
+
"[nef3d47wx7hdxcyvwgucihijvag3qlbodqmms7dktjkxqgk4gux] example_inputs[0]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096, 8192]), stride=(8192, 1), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 514 |
+
"[7eps4cy57l62xkqx7rnf6ttfsuweegaqsqravzj2x5h4v6fbtod] example_inputs[1]: TensorMetadata(dtype=torch.float32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 515 |
+
"[dpovg5nw4n7fkaetfrkwcqepypqcssr7fzpd75svn53n4xjxfow] example_inputs[2]: TensorMetadata(dtype=torch.int32, shape=torch.Size([4096]), stride=(1,), device=device(type='cuda', index=0), layout=torch.strided, memory_format=torch.contiguous_format, storage_offset=0, storage_bytes=None, requires_grad=False, is_quantized=False, is_conj=False, is_neg=False, is_inference=False, is_sparse=False, is_coalesced=None, dense_dim=None, sparse_dim=None)",
|
| 516 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] cache_key_tag: ",
|
| 517 |
+
"[lmglpn4zi7vob56n34r2j2rk7flv5xfgrcvmo7xcpirqsitygqx] fx_kwargs[boxed_forward_device_index]: BoxedDeviceIndex(value=None)",
|
| 518 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[cpp_wrapper]: False",
|
| 519 |
+
"[xq2hdkbfkbcuye6rgtypayrkhqf4cntij2dsd24rei3lsknakkf] fx_kwargs[cudagraphs]: BoxedBool(value=False)",
|
| 520 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[extern_node_serializer]: None",
|
| 521 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] fx_kwargs[is_backward]: False",
|
| 522 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] fx_kwargs[is_inference]: True",
|
| 523 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] fx_kwargs[layout_opt]: None",
|
| 524 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] fx_kwargs[static_input_idxs]: []",
|
| 525 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inputs_to_check[0]: 0",
|
| 526 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inputs_to_check[1]: 1",
|
| 527 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inputs_to_check[2]: 2",
|
| 528 |
+
"[du4vyrfyozrfxcf6kk6ma7oqwatapifazeelfsawmsiu6gjdtxp] deterministic_algorithms_settings: (False, False, True)",
|
| 529 |
+
"[qiptf2633zubseuei4bkisoq3not35l6lud6p23p4qmcsxiw2uq] cuda_matmul_settings: (False, True, True)",
|
| 530 |
+
"[ol6sj5vrtmgqd5cnfjbun7wbukfn7jyrtpkapnhmsysjdypit4i] torch_version: <bytes>",
|
| 531 |
+
"[rlwghyno43ot2zz35l3xlcrrh3arqenri6t5nsopt3t3q333zgy] system_info[device]: {'name': 'gfx942:sramecc+:xnack-'}",
|
| 532 |
+
"[njkbnmcun3rnt2yz2lgf57oprgdbjzlkadbcfoy57sir5fnskzg] system_info[version]: {'triton': '3.3.02e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-364a7d1dd5f29867a741138f83c5b453259e240a5d51f364f24f7196cedbf442-2e234c1d93a7cae949341b60b8567f825914128ed598e1d846c8bc19a9d65ad8-23d635e690d670bf61798e1259674b78c0ed5ba222ab6a455f329f27a758fc2d-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-ca6686d24a6f780b8449b43d419d11c978ebd00ab87a5fc6e57198a2027680d0-00deb4ba92653e089ad09c2f67cbc85602c84cd3ee2347ddcfcccc2081cfa45e-e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855-78995dd40c4e54964f62cdc6d47e66f6d9df8b55b172ad7eb99235f27999c840-f7c26e8ffdaf8cd2491de04217d32827b1a4f859f7f93ea56e26590c9f5e071a-a5b982237b29a230519ad566660a5912ae9d31da0dd6388465f3a1043b12ece7-6e4a7df0c1f6cb799f488ee1d6efd3df754fc18aac6e7209923bb022c36c7c4e-f983f9d6d6f987af520297c8fe3185601ae8f7d60bacab880ac9326bdfee1f67-5d15c5bebef8d7aa51b21fd187e5faa95eba4a213254355bc69e0648013599f7-26a8aeaf21e759191f173b578316e243ad970387442a1b238481c6a1b2eecdc4-bd364752852b76a0b75a9d93ecbc239781b730aa75021445a02d795aa8d38f6a-72bc1771d8b160fbafcd5390d1ee6cb72440c10ad4834451465a9e93b42f5d1c-7b506c955ee5646862dae548968e6523d75c37ad4750c214d9ab0f6918ecc88a-89e4844782de5fdff4868ac2846514570a6e280a6b92e91af2e180904043c833-115ada51f797cd098ddc5e4b95e8369a885571b15639694b6801f59e46eab55e-0e48b5e1e95136642ccfe62dc3d0a739a2c20a7b5ee13e9c23c6cecd68cdeb70-b616015f724e553348f5b019f7324dec130f7bbaf984d43300fa69c7c2fdda2f-54fe722cbe379a55695ab9478e73d344377cf5e9d6e055aff7cd03bf6fff1b2a-10285555cd515e21ca54714fc8eb9c173cca6b092b5e951a17ae5eee28ed2707-f2d4e73182e68eddc6237577b2158b7d8498ccb3c50642b9c74c55d3f4be3943', 'hip': '6.3.42131-fa1d09cbd'}",
|
| 533 |
+
"[3qefpuc3yyxaxf25vrqt6skezzayzydwq2o6i2xf2qdyioam5zw] system_info[hash]: 6e7af1eb52fca9b11dcfccdeb7b2a74263a0c6d2c07fe2b7f2c2003a4663609b",
|
| 534 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[TYPE_CHECKING]: False",
|
| 535 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_padding]: True",
|
| 536 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[can_inplace_pad_graph_input]: False",
|
| 537 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[enable_auto_functionalized_v2]: True",
|
| 538 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug]: False",
|
| 539 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_progress]: True",
|
| 540 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[verbose_progress]: False",
|
| 541 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[fx_graph_cache]: True",
|
| 542 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[fx_graph_remote_cache]: None",
|
| 543 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bundle_triton_into_fx_graph_cache]: True",
|
| 544 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_local_cache]: True",
|
| 545 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[autotune_remote_cache]: None",
|
| 546 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[bundled_autotune_remote_cache]: None",
|
| 547 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_disable_caches]: False",
|
| 548 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[sleep_sec_TESTING_ONLY]: None",
|
| 549 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[custom_op_default_layout_constraint]: needs_fixed_stride_order",
|
| 550 |
+
"[pikr7bbcoixfzftsazp5ggufhdklj24babfry77bl4nuvyrrcp4] inductor_config[triton_kernel_default_layout_constraint]: needs_fixed_stride_order",
|
| 551 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp_wrapper]: False",
|
| 552 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[online_softmax]: True",
|
| 553 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[dce]: False",
|
| 554 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[static_weight_shapes]: True",
|
| 555 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[size_asserts]: True",
|
| 556 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[nan_asserts]: False",
|
| 557 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[scalar_asserts]: True",
|
| 558 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pick_loop_orders]: True",
|
| 559 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[inplace_buffers]: True",
|
| 560 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[allow_buffer_reuse]: True",
|
| 561 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[memory_planning]: False",
|
| 562 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[use_fast_math]: False",
|
| 563 |
+
"[x75won4jmsgeb63pcvwr2y4eteyzzdhmf5rv6xhjppie4hx2yu5] inductor_config[memory_pool]: intermediates",
|
| 564 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_harness]: True",
|
| 565 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[epilogue_fusion]: True",
|
| 566 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[prologue_fusion]: True",
|
| 567 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[epilogue_fusion_first]: False",
|
| 568 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[pattern_matcher]: True",
|
| 569 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[b2b_gemm_pass]: False",
|
| 570 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_pre_pass]: None",
|
| 571 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[joint_custom_post_pass]: None",
|
| 572 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[pre_grad_custom_pass]: None",
|
| 573 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_cat_fx_passes]: True",
|
| 574 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[efficient_conv_bn_eval_fx_passes]: False",
|
| 575 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_predispatch]: False",
|
| 576 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[group_fusion]: False",
|
| 577 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[batch_fusion]: True",
|
| 578 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[pre_grad_fusion_options]: {}",
|
| 579 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[post_grad_fusion_options]: {}",
|
| 580 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_locality]: True",
|
| 581 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[dynamic_scale_rblock]: True",
|
| 582 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_fuse_int_mm_with_mul]: False",
|
| 583 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_mixed_mm]: True",
|
| 584 |
+
"[zwmmbkdkarexuhbigurz5lfnhx64tht7fznecjkrvznh6rzivbv] inductor_config[fx_passes_numeric_check]: {'pre_grad': False, 'precision': 0.0001, 'num_iterations': 1, 'requires_optimizer': True}",
|
| 585 |
+
"[v2td5s4lnsvyxvaevy4chx6kc5h3mm2axazbgwimqule5zrzao7] inductor_config[mixed_mm_choice]: heuristic",
|
| 586 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[reorder_for_compute_comm_overlap]: False",
|
| 587 |
+
"[ssupi7bu3rrhdpg2jyegzncu3kg3nnhklyliqvutaxgs7y7k3dx] inductor_config[reorder_for_compute_comm_overlap_passes]: ['reorder_compute_for_overlap', 'sink_waits', 'raise_comms']",
|
| 588 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[reorder_for_peak_memory]: True",
|
| 589 |
+
"[lxxtoqhcoepwfokeiibd575gnxo3uzwiv4hmpomlwkpzqz3qzsh] inductor_config[estimate_op_runtime]: default",
|
| 590 |
+
"[yezuzjtg4h3jjur4jwtwiehbyixa7eonq4tqsqmwqve2lvvmrem] inductor_config[intra_node_bw]: 300",
|
| 591 |
+
"[5fxczt3ciyxitdhizb7sfsgn7fhpczcqsngttnt5ot2wyctk7co] inductor_config[inter_node_bw]: 25",
|
| 592 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[use_experimental_benchmarker]: True",
|
| 593 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[max_autotune]: True",
|
| 594 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_pointwise]: False",
|
| 595 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[max_autotune_gemm]: False",
|
| 596 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[autotune_num_choices_displayed]: 10",
|
| 597 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[graph_partition]: False",
|
| 598 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_same_precision]: False",
|
| 599 |
+
"[2y7luesktjrque3nr7qtxnum2mkbeegzdrsvkm3rvdlhqboajhx] inductor_config[max_autotune_gemm_backends]: ATEN,TRITON,CPP",
|
| 600 |
+
"[uqlsbif4zxd75vt522p52txyuguieipi2lwz5g5awt56lccqk7s] inductor_config[max_autotune_conv_backends]: ATEN,TRITON",
|
| 601 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[max_autotune_gemm_search_space]: DEFAULT",
|
| 602 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[autotune_fallback_to_aten]: True",
|
| 603 |
+
"[wft6ljqsfr3x4m7fa5zuyb7cwknky4irrxz4bjr6uzr2yiopxqj] inductor_config[unbacked_symint_fallback]: 8192",
|
| 604 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[search_autotune_cache]: False",
|
| 605 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[save_args]: False",
|
| 606 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_in_subproc]: False",
|
| 607 |
+
"[iglov24t7x5ruci344aer2tm6nqshi4veuw4wxlssxtu46cx76m] inductor_config[max_autotune_subproc_result_timeout_seconds]: 60.0",
|
| 608 |
+
"[bh33ranllcgilhgmgr3qvygzxjm6isq5iexnfm3zx6fnr2zwlp2] inductor_config[max_autotune_subproc_graceful_timeout_seconds]: 1.0",
|
| 609 |
+
"[pwoh5aypf4fxbntdvwt67rppxorqos6xr3w7qzeun6kblbfg2ga] inductor_config[max_autotune_subproc_terminate_timeout_seconds]: 2.0",
|
| 610 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[autotune_multi_device]: False",
|
| 611 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[coordinate_descent_tuning]: True",
|
| 612 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[coordinate_descent_check_all_directions]: False",
|
| 613 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[coordinate_descent_search_radius]: 1",
|
| 614 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[autoheuristic_collect]: ",
|
| 615 |
+
"[jwbrgxes7vjqumngs5hyj6gn5nytv2whnppnzngvaagfmawhkkd] inductor_config[autoheuristic_use]: mixed_mm",
|
| 616 |
+
"[jvchmi66fvqzlemhr5fcqorz5trfdtdalzfagtj2aolmimwqhdq] inductor_config[autoheuristic_log_path]: DEFAULT",
|
| 617 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[layout_opt_default]: 0",
|
| 618 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[layout_optimization]: False",
|
| 619 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_layout_optimization]: False",
|
| 620 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[keep_output_stride]: True",
|
| 621 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[warn_mix_layout]: False",
|
| 622 |
+
"[lkkae3meylaixfif4thncru4hjqeaislawjoghffrbwuscaagei] inductor_config[realize_reads_threshold]: 4",
|
| 623 |
+
"[rr5m5hsocoyodldz7vcvaizdwvm2rt34evmqdxvng7wz3tufvo6] inductor_config[realize_opcount_threshold]: 30",
|
| 624 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[realize_acc_reads_threshold]: 8",
|
| 625 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[fallback_random]: False",
|
| 626 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[implicit_fallbacks]: True",
|
| 627 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aggressive_fusion]: False",
|
| 628 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_fusion]: False",
|
| 629 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_fusion]: False",
|
| 630 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[enabled_metric_tables]: ",
|
| 631 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[loop_ordering_after_fusion]: False",
|
| 632 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[score_fusion_memory_threshold]: 10",
|
| 633 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[benchmark_epilogue_fusion]: True",
|
| 634 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[max_epilogue_benchmarked_choices]: 1",
|
| 635 |
+
"[jykiys6ynafs3zdylwa5ggq6j655mxeh42d6mtdi22gffkrmiac] inductor_config[max_fusion_size]: 64",
|
| 636 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[max_pointwise_cat_inputs]: 8",
|
| 637 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_pointwise_cat]: False",
|
| 638 |
+
"[yttmfmxblgcbsvbokguzowcorrcxz5uunxtcvsbe6nijgcx45he] inductor_config[unroll_reductions_threshold]: 8",
|
| 639 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[comment_origin]: False",
|
| 640 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[conv_1x1_as_mm]: False",
|
| 641 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[split_reductions]: True",
|
| 642 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_kernel]: False",
|
| 643 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[constant_and_index_propagation]: True",
|
| 644 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[always_keep_tensor_constants]: False",
|
| 645 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[assert_indirect_indexing]: True",
|
| 646 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[compute_all_bounds]: False",
|
| 647 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernels]: False",
|
| 648 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[benchmark_combo_kernel]: False",
|
| 649 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernels_autotune]: 1",
|
| 650 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[combo_kernel_allow_mixed_sizes]: 1",
|
| 651 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[combo_kernel_foreach_dynamic_shapes]: False",
|
| 652 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[joint_graph_constant_folding]: True",
|
| 653 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_index_asserts]: False",
|
| 654 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[emulate_precision_casts]: False",
|
| 655 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[is_nightly_or_source]: False",
|
| 656 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[developer_warnings]: False",
|
| 657 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[optimize_scatter_upon_const_tensor]: True",
|
| 658 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[add_pre_grad_passes]: None",
|
| 659 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[remove_pre_grad_passes]: None",
|
| 660 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[global_cache_dir]: None",
|
| 661 |
+
"[j6c55jha5r2sdys2rwq7uqhtleea5dgjcye7nicfgft36v7xfvp] inductor_config[kernel_name_max_ops]: 10",
|
| 662 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[shape_padding]: True",
|
| 663 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[comprehensive_padding]: True",
|
| 664 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_channels_last]: False",
|
| 665 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[disable_padding_cpu]: True",
|
| 666 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[padding_alignment_bytes]: 128",
|
| 667 |
+
"[dnnw5ks3yxrp7mwvihb2hh4tqx35ye637xt33x64kw4fvz2nyzg] inductor_config[padding_stride_threshold]: 1024",
|
| 668 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[pad_outputs]: False",
|
| 669 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[bw_outputs_user_visible]: True",
|
| 670 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[force_shape_pad]: False",
|
| 671 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[permute_fusion]: False",
|
| 672 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profiler_mark_wrapper_call]: False",
|
| 673 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[generate_intermediate_hooks]: False",
|
| 674 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[debug_ir_traceback]: False",
|
| 675 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth]: False",
|
| 676 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[profile_bandwidth_regex]: ",
|
| 677 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[profile_bandwidth_output]: None",
|
| 678 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[profile_bandwidth_with_do_bench_using_profiling]: False",
|
| 679 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[disable_cpp_codegen]: False",
|
| 680 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing]: False",
|
| 681 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[freezing_discard_parameters]: False",
|
| 682 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[decompose_mem_bound_mm]: False",
|
| 683 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[assume_aligned_inputs]: False",
|
| 684 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[unsafe_ignore_unsupported_triton_autotune_args]: False",
|
| 685 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[check_stack_no_cycles_TESTING_ONLY]: False",
|
| 686 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[enable_linear_binary_folding]: False",
|
| 687 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[annotate_training]: False",
|
| 688 |
+
"[sz3im5ogc6asp7g4uqocnovype63tkdexzfrniv6hn2oank3biu] inductor_config[cpp.threads]: -1",
|
| 689 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.no_redundant_loops]: True",
|
| 690 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.dynamic_threads]: False",
|
| 691 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.simdlen]: None",
|
| 692 |
+
"[g7rrnbg5yonzux3cfj5ovre5lob3ayda7qcfpxjvtwmiz4uicii] inductor_config[cpp.min_chunk_size]: 4096",
|
| 693 |
+
"[c7zj4qytmety6keurs3hsh5wn7foxp3dqx4kym2ucszzcb2ngrf] inductor_config[cpp.cxx]: (None, 'g++')",
|
| 694 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_kernel_profile]: False",
|
| 695 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.weight_prepack]: True",
|
| 696 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_relu_bug_TESTING_ONLY]: None",
|
| 697 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.inject_log1p_bug_TESTING_ONLY]: None",
|
| 698 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.vec_isa_ok]: None",
|
| 699 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[cpp.descriptive_names]: original_aten",
|
| 700 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[cpp.max_horizontal_fusion_size]: 16",
|
| 701 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.fallback_scatter_reduce_sum]: True",
|
| 702 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_unsafe_math_opt_flag]: False",
|
| 703 |
+
"[ijs44lspkinjvhcs7uff7n3noc53jvsp4yfljjh22mafhb7khxe] inductor_config[cpp.enable_floating_point_contract_flag]: off",
|
| 704 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_tiling_heuristics]: True",
|
| 705 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_grouped_gemm_template]: False",
|
| 706 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cpp.gemm_max_k_slices]: 1",
|
| 707 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_cache_blocking]: None",
|
| 708 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cpp.gemm_thread_factors]: None",
|
| 709 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[cpp.enable_loop_tail_vec]: True",
|
| 710 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cpp.enable_concat_linear]: False",
|
| 711 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraphs]: False",
|
| 712 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_trees]: True",
|
| 713 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_skip_dynamic_graphs]: False",
|
| 714 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.slow_path_cudagraph_asserts]: True",
|
| 715 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cudagraph_trees_history_recording]: False",
|
| 716 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.cudagraph_support_input_mutation]: True",
|
| 717 |
+
"[ljdqgtysl3vdf7j6attlz5gmjg2ncihnveojfyubosplmkrjgra] inductor_config[triton.cudagraph_unexpected_rerecord_limit]: 128",
|
| 718 |
+
"[tuax46wac7rfv2trf5gcps6vleo3cq44lbnrdxtprvo3ljjaddj] inductor_config[triton.cudagraph_dynamic_shape_warn_limit]: 50",
|
| 719 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraph_sync]: False",
|
| 720 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cudagraphs_warmup]: False",
|
| 721 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.fast_path_cudagraph_asserts]: False",
|
| 722 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_cudagraph_warmup]: False",
|
| 723 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_graph]: False",
|
| 724 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.debug_sync_kernel]: False",
|
| 725 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.dense_indexing]: False",
|
| 726 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[triton.max_tiles]: 2",
|
| 727 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.prefer_nd_tiling]: False",
|
| 728 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_pointwise]: True",
|
| 729 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.autotune_cublasLt]: True",
|
| 730 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.autotune_at_compile_time]: None",
|
| 731 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.tile_reductions]: False",
|
| 732 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_pointwise_fusion]: True",
|
| 733 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.tiling_prevents_reduction_fusion]: True",
|
| 734 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.unique_kernel_names]: True",
|
| 735 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.unique_user_kernel_names]: False",
|
| 736 |
+
"[yrty22bseefglnysuoec4ji7j2rnaggdj3g33zzj7avogwfmgdw] inductor_config[triton.descriptive_names]: original_aten",
|
| 737 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.persistent_reductions]: True",
|
| 738 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.cooperative_reductions]: False",
|
| 739 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.force_cooperative_reductions]: False",
|
| 740 |
+
"[vrl5ktomgtzox5xucd3np6vug3vyj6hwwzahqijuwpmamlv7ohi] inductor_config[triton.multi_kernel]: 0",
|
| 741 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.divisible_by_16]: True",
|
| 742 |
+
"[fv6slhtedtydps5s5u2etitscliblzcidyitqf7krsv4e23fzk6] inductor_config[triton.min_split_scan_rblock]: 256",
|
| 743 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.store_cubin]: False",
|
| 744 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[triton.spill_threshold]: 16",
|
| 745 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.use_block_ptr]: False",
|
| 746 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[triton.inject_relu_bug_TESTING_ONLY]: None",
|
| 747 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[triton.codegen_upcast_to_fp32]: True",
|
| 748 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.enable_persistent_tma_matmul]: False",
|
| 749 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.skip_l1_cache]: False",
|
| 750 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[triton.disallow_failing_autotune_kernels_TESTING_ONLY]: False",
|
| 751 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.output_path]: ",
|
| 752 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.debug_compile]: False",
|
| 753 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.compile_wrapper_with_O0]: False",
|
| 754 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[aot_inductor.debug_intermediate_value_printer]: 0",
|
| 755 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[aot_inductor.filtered_kernel_names]: None",
|
| 756 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_in_spec]: ",
|
| 757 |
+
"[v3hzzlv4tjgvp3pyhmzagjd25orl6n7nynoa7svlhhwk73b7u3c] inductor_config[aot_inductor.serialized_out_spec]: ",
|
| 758 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_runtime_constant_folding]: False",
|
| 759 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.force_mmap_weights]: False",
|
| 760 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package]: False",
|
| 761 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.package_cpp_only]: False",
|
| 762 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.metadata]: {}",
|
| 763 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.raise_error_on_ignored_optimization]: True",
|
| 764 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.dump_aoti_minifier]: False",
|
| 765 |
+
"[pr5nr4a7dthirgd2ljo3d2xakc63ywxugusu6mkmr6gmpeliyib] inductor_config[aot_inductor.repro_level]: 2",
|
| 766 |
+
"[4bryyl4ahh5whyg3zwqebpwmjnx6w77nqgqbdjlowju6lkqtn7w] inductor_config[aot_inductor.presets]: {}",
|
| 767 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.allow_stack_allocation]: False",
|
| 768 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[aot_inductor.use_minimal_arrayref_interface]: False",
|
| 769 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[aot_inductor.package_constants_in_so]: True",
|
| 770 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.arch]: None",
|
| 771 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.version]: None",
|
| 772 |
+
"[tvyftmtdmezlejo2xllu7awzv4pzc4vm4fub4b3gpl5jptjkosi] inductor_config[cuda.compile_opt_level]: -O1",
|
| 773 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_cuda_lto]: False",
|
| 774 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_ptxas_info]: False",
|
| 775 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.enable_debug_info]: False",
|
| 776 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.use_fast_math]: False",
|
| 777 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_max_profiling_configs]: None",
|
| 778 |
+
"[xaicuyqjstadzph6cgvxowlzizkts6kzmfupsnbyaorxh37cppz] inductor_config[cuda.cutlass_max_profiling_swizzle_options]: [1, 2, 4]",
|
| 779 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cuda_cxx]: None",
|
| 780 |
+
"[aghvyrrgwvxijco2pk5wzc3cgmmthrbmgxitiibxuuscxdwrjd3] inductor_config[cuda.cutlass_backend_min_gemm_size]: 1",
|
| 781 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[cuda.generate_test_runner]: False",
|
| 782 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_allowlist_regex]: None",
|
| 783 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[cuda.cutlass_op_denylist_regex]: None",
|
| 784 |
+
"[ngkkx5e6z7erl6da23zb2cmsctz4yvaqyameyg5hbqln4wrhh7x] inductor_config[cuda.cutlass_instantiation_level]: 0",
|
| 785 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[rocm.arch]: []",
|
| 786 |
+
"[3w3j4h2iiu3addwyb5alaeecz3so7teb23hp4d5n3b46w5n73ur] inductor_config[rocm.ck_supported_arch]: ['gfx90a', 'gfx942']",
|
| 787 |
+
"[klfqjprnpfhcdurgvuikvc4rpd5ynkpk77toousr5h3u5roty6p] inductor_config[rocm.compile_opt_level]: -O2",
|
| 788 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.is_debug]: False",
|
| 789 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.save_temps]: False",
|
| 790 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.use_fast_math]: True",
|
| 791 |
+
"[cev5uo2jlwdhw2uyzcm7vr6cl23azjfw437f5r5lskm7spucos6] inductor_config[rocm.flush_denormals]: True",
|
| 792 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.print_kernel_resource_usage]: False",
|
| 793 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.rocm_home]: None",
|
| 794 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.ck_dir]: None",
|
| 795 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.generate_test_runner]: False",
|
| 796 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.n_max_profiling_configs]: None",
|
| 797 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[rocm.use_preselected_instances]: False",
|
| 798 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[rocm.kBatch_sweep]: None",
|
| 799 |
+
"[ebt2ncs4f5y7dn7btzi76mnouepvzad474tmp5iju4wiuumjl4s] inductor_config[rocm.split_k_threshold]: 16",
|
| 800 |
+
"[bsvfcwwoczx2rlkdz2eta6doujsymyihmi46hhwk6clrrvwcb6m] inductor_config[cpu_backend]: cpp",
|
| 801 |
+
"[caw4ly2z672k6kjfahoxwpajp5idhhtrpgf3ma2clylcp7c7aid] inductor_config[cuda_backend]: triton",
|
| 802 |
+
"[ljhgflgihidopsfsdcbqynv27nceykby3nutyd5jlcpq7n6e7l4] inductor_config[halide.cpu_target]: host",
|
| 803 |
+
"[wx7vmsmrdpk5ue2txlywp3lj3faqmdjphs5fgg2ehzsyno7uovg] inductor_config[halide.gpu_target]: host-cuda",
|
| 804 |
+
"[svgytlua5wcyeia7wq7e6zgh5tsueikrnzchmdmouvmkpfsc2zq] inductor_config[halide.scheduler_cuda]: Anderson2021",
|
| 805 |
+
"[k5ogk6345jvklsnu7g2njqstiz2g6pm5wmqpgg3kasrmuqwjvl6] inductor_config[halide.scheduler_cpu]: Adams2019",
|
| 806 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.asserts]: False",
|
| 807 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.debug]: False",
|
| 808 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[halide.scan_kernels]: False",
|
| 809 |
+
"[h25wqx6vliw4j5rtzzbv6latydxyei3deyg6v7wzvnzryfktuki] inductor_config[external_matmul]: []",
|
| 810 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.force_extern_kernel_in_multi_template]: False",
|
| 811 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.max_mm_configs]: None",
|
| 812 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.runtime_triton_dtype_assert]: False",
|
| 813 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_name_regex]: None",
|
| 814 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] inductor_config[test_configs.autotune_choice_desc_regex]: None",
|
| 815 |
+
"[esstihe2nyydk4mhzpvox3qkajyu5y5t23hk3fi2me7jn75xi3o] inductor_config[test_configs.graphsafe_rng_func_ignores_fallback_random]: False",
|
| 816 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_pre_pass: None",
|
| 817 |
+
"[tquy2we2efmowuj4wuqzcfcfdcrkzkzmwdae6hprj7fa64jpusq] post_grad_custom_post_pass: None"
|
| 818 |
+
],
|
| 819 |
+
"fn_name": "compile_fx_inner",
|
| 820 |
+
"is_backward": false,
|
| 821 |
+
"key": "fr57fwh6rfk65wtgsmaeq6p7domzwaxezpig6cnku7tl6zrhoujz",
|
| 822 |
+
"local_cache_enabled": true,
|
| 823 |
+
"remote_cache_enabled": false
|
| 824 |
+
},
|
| 825 |
+
"cat": "dynamo_timed",
|
| 826 |
+
"name": "inductor_compile",
|
| 827 |
+
"ph": "E",
|
| 828 |
+
"pid": 0,
|
| 829 |
+
"tid": 0,
|
| 830 |
+
"ts": 1750251842527055.8
|
| 831 |
+
},
|
| 832 |
+
{
|
| 833 |
+
"args": {
|
| 834 |
+
"compile_id": "0/0"
|
| 835 |
+
},
|
| 836 |
+
"cat": "dynamo_timed",
|
| 837 |
+
"name": "compile_fx.<locals>.fw_compiler_base",
|
| 838 |
+
"ph": "E",
|
| 839 |
+
"pid": 0,
|
| 840 |
+
"tid": 0,
|
| 841 |
+
"ts": 1750251842528002.0
|
| 842 |
+
},
|
| 843 |
+
{
|
| 844 |
+
"args": {
|
| 845 |
+
"compile_id": "0/0"
|
| 846 |
+
},
|
| 847 |
+
"cat": "dynamo_timed",
|
| 848 |
+
"name": "create_aot_dispatcher_function",
|
| 849 |
+
"ph": "E",
|
| 850 |
+
"pid": 0,
|
| 851 |
+
"tid": 0,
|
| 852 |
+
"ts": 1750251842530288.2
|
| 853 |
+
},
|
| 854 |
+
{
|
| 855 |
+
"args": {
|
| 856 |
+
"cache_bypass_hard_exception": false,
|
| 857 |
+
"cache_bypass_reason": "Unsupported call_function target <class 'torch.autograd.function.FunctionCtx'>. \n Function module: torch.autograd.function, \nFunction name: FunctionCtx",
|
| 858 |
+
"cache_state": "bypass",
|
| 859 |
+
"compile_id": "0/0",
|
| 860 |
+
"components": [],
|
| 861 |
+
"key": null
|
| 862 |
+
},
|
| 863 |
+
"cat": "dynamo_timed",
|
| 864 |
+
"name": "autograd_cache_bypass",
|
| 865 |
+
"ph": "i",
|
| 866 |
+
"pid": 0,
|
| 867 |
+
"s": "p",
|
| 868 |
+
"tid": 0,
|
| 869 |
+
"ts": 1750251841793382.2
|
| 870 |
+
},
|
| 871 |
+
{
|
| 872 |
+
"args": {
|
| 873 |
+
"cache_bypass_reason": "Unsupported call_function target <class 'torch.autograd.function.FunctionCtx'>. \n Function module: torch.autograd.function, \nFunction name: FunctionCtx",
|
| 874 |
+
"cache_event_time": 1750251841793382207,
|
| 875 |
+
"cache_state": "bypass",
|
| 876 |
+
"compile_id": "0/0",
|
| 877 |
+
"components": [],
|
| 878 |
+
"dispatch_mode": "inference",
|
| 879 |
+
"fn_name": "OutputGraph.call_user_compiler",
|
| 880 |
+
"key": null,
|
| 881 |
+
"local_cache_enabled": true,
|
| 882 |
+
"remote_cache_enabled": false,
|
| 883 |
+
"requires_subclass_dispatch": false
|
| 884 |
+
},
|
| 885 |
+
"cat": "dynamo_timed",
|
| 886 |
+
"name": "backend_compile",
|
| 887 |
+
"ph": "E",
|
| 888 |
+
"pid": 0,
|
| 889 |
+
"tid": 0,
|
| 890 |
+
"ts": 1750251842544082.2
|
| 891 |
+
},
|
| 892 |
+
{
|
| 893 |
+
"args": {
|
| 894 |
+
"compile_id": "0/0",
|
| 895 |
+
"fn_name": "_compile.compile_inner"
|
| 896 |
+
},
|
| 897 |
+
"cat": "dynamo_timed",
|
| 898 |
+
"name": "entire_frame_compile",
|
| 899 |
+
"ph": "E",
|
| 900 |
+
"pid": 0,
|
| 901 |
+
"tid": 0,
|
| 902 |
+
"ts": 1750251842551017.2
|
| 903 |
+
},
|
| 904 |
+
{
|
| 905 |
+
"args": {
|
| 906 |
+
"compile_id": "0/0"
|
| 907 |
+
},
|
| 908 |
+
"cat": "dynamo_timed",
|
| 909 |
+
"name": "gc",
|
| 910 |
+
"ph": "B",
|
| 911 |
+
"pid": 0,
|
| 912 |
+
"tid": 0,
|
| 913 |
+
"ts": 1750251842551354.2
|
| 914 |
+
},
|
| 915 |
+
{
|
| 916 |
+
"args": {
|
| 917 |
+
"compile_id": "0/0"
|
| 918 |
+
},
|
| 919 |
+
"cat": "dynamo_timed",
|
| 920 |
+
"name": "gc",
|
| 921 |
+
"ph": "E",
|
| 922 |
+
"pid": 0,
|
| 923 |
+
"tid": 0,
|
| 924 |
+
"ts": 1750251842552469.2
|
| 925 |
+
},
|
| 926 |
+
{
|
| 927 |
+
"args": {
|
| 928 |
+
"accumulated_cache_size": 0,
|
| 929 |
+
"cache_size": 0,
|
| 930 |
+
"co_filename": "/shared_volume/repos/quark/bench_qdq.py",
|
| 931 |
+
"co_firstlineno": 7,
|
| 932 |
+
"co_name": "run_scaled_fake_quantize",
|
| 933 |
+
"compile_id": "0/0",
|
| 934 |
+
"compliant_custom_ops": [],
|
| 935 |
+
"distributed_ephemeral_timeout_us": 427407,
|
| 936 |
+
"dynamo_config": "{\"_autograd_backward_strict_mode_conditional_banned_ops\": [\"stride\", \"storage_offset\", \"is_contiguous\"], \"_unsafe_skip_fsdp_module_guards\": false, \"accumulated_recompile_limit\": 256, \"allow_complex_guards_as_runtime_asserts\": false, \"allow_empty_graphs\": false, \"allow_ignore_mark_dynamic\": false, \"allow_rnn\": false, \"allow_unspec_int_on_nn_module\": false, \"allowed_functions_module_string_ignorelist\": [\"torch._decomp\", \"torch._prims\", \"torch._refs\", \"torch.distributions\", \"torch.testing\"], \"assume_static_by_default\": true, \"automatic_dynamic_local_pgo\": true, \"automatic_dynamic_remote_pgo\": null, \"automatic_dynamic_shapes\": true, \"automatic_dynamic_shapes_mark_as\": \"dynamic\", \"capture_autograd_function\": true, \"capture_dynamic_output_shape_ops\": false, \"capture_func_transforms\": true, \"capture_scalar_outputs\": false, \"capture_sparse_compute\": true, \"compiled_autograd\": false, \"compiled_autograd_kwargs_override\": {}, \"cprofile\": false, \"cudagraph_backend_keep_input_mutation\": false, \"cudagraph_backend_support_input_mutation\": false, \"dead_code_elimination\": true, \"disable\": false, \"do_not_emit_runtime_asserts\": false, \"dynamic_shapes\": true, \"enable_compiler_collectives\": false, \"enable_cpp_framelocals_guard_eval\": true, \"enable_cpp_guard_manager\": true, \"enable_cpp_symbolic_shape_guards\": false, \"enable_faithful_generator_behavior\": true, \"enable_trace_contextlib\": true, \"error_on_nested_fx_trace\": true, \"error_on_nested_jit_trace\": true, \"error_on_recompile\": false, \"fail_on_recompile_limit_hit\": false, \"fake_tensor_cache_crosscheck_enabled\": false, \"fake_tensor_cache_enabled\": true, \"force_nn_module_property_static_shapes\": true, \"force_parameter_static_shapes\": true, \"force_unspec_int_unbacked_size_like_on_torchrec_kjt\": false, \"guard_nn_modules\": true, \"guard_nn_modules_using_dict_tags\": true, \"inline_inbuilt_nn_modules\": true, 
\"issue_3_13_0_warning\": true, \"minimum_call_count\": 1, \"numpy_default_complex\": \"complex128\", \"numpy_default_float\": \"float64\", \"numpy_default_int\": \"int64\", \"only_allow_pt2_compliant_ops\": false, \"optimize_ddp\": true, \"optimize_ddp_lazy_compile\": false, \"prefer_deferred_runtime_asserts_over_guards\": false, \"prepare_freezing\": false, \"raise_on_ctx_manager_usage\": true, \"raise_on_unsafe_aot_autograd\": false, \"recompile_limit\": 8, \"record_compile_time_instruction_count\": false, \"replay_record_enabled\": false, \"report_guard_failures\": true, \"rewrite_assert_with_torch_assert\": true, \"run_gc_after_compile\": true, \"skip_code_recursive_on_recompile_limit_hit\": true, \"skip_fsdp_guards\": true, \"skip_fsdp_hooks\": true, \"skip_nnmodule_hook_guards\": true, \"skip_no_tensor_aliasing_guards_on_parameters\": true, \"skip_tensor_guards_with_matching_dict_tags\": true, \"skip_torchrec\": true, \"skipfiles_inline_module_allowlist\": {}, \"specialize_float\": false, \"specialize_int\": false, \"suppress_errors\": false, \"trace_numpy\": true, \"track_nodes_for_deduplication\": false, \"use_graph_deduplication\": false, \"use_lazy_graph_module\": true, \"use_numpy_random_stream\": false, \"verify_correctness\": false}",
|
| 937 |
+
"dynamo_time_before_restart_s": 0.0,
|
| 938 |
+
"fail_reason": null,
|
| 939 |
+
"fail_type": null,
|
| 940 |
+
"fail_user_frame_filename": null,
|
| 941 |
+
"fail_user_frame_lineno": null,
|
| 942 |
+
"frame_key": "1",
|
| 943 |
+
"graph_input_count": 3,
|
| 944 |
+
"graph_node_count": 6,
|
| 945 |
+
"graph_op_count": 2,
|
| 946 |
+
"guard_count": 21,
|
| 947 |
+
"guard_latency_us": 0,
|
| 948 |
+
"has_guarded_code": true,
|
| 949 |
+
"non_compliant_ops": [
|
| 950 |
+
"quark::scaled_fake_quantize"
|
| 951 |
+
],
|
| 952 |
+
"restart_reasons": [],
|
| 953 |
+
"shape_env_guard_count": 0
|
| 954 |
+
},
|
| 955 |
+
"cat": "dynamo_timed",
|
| 956 |
+
"name": "dynamo",
|
| 957 |
+
"ph": "E",
|
| 958 |
+
"pid": 0,
|
| 959 |
+
"tid": 0,
|
| 960 |
+
"ts": 1750251842558796.5
|
| 961 |
+
}
|
| 962 |
+
]
|
compile_directory.json
ADDED
|
@@ -0,0 +1,78 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"[0/0]": {
|
| 3 |
+
"artifacts": [
|
| 4 |
+
{
|
| 5 |
+
"name": "dynamo_output_graph_0.txt",
|
| 6 |
+
"number": 0,
|
| 7 |
+
"suffix": "",
|
| 8 |
+
"url": "-_0_0_0/dynamo_output_graph_0.txt"
|
| 9 |
+
},
|
| 10 |
+
{
|
| 11 |
+
"name": "inductor_pre_grad_graph_1.txt",
|
| 12 |
+
"number": 1,
|
| 13 |
+
"suffix": "",
|
| 14 |
+
"url": "-_0_0_0/inductor_pre_grad_graph_1.txt"
|
| 15 |
+
},
|
| 16 |
+
{
|
| 17 |
+
"name": "before_recompile_pre_grad_2.txt",
|
| 18 |
+
"number": 2,
|
| 19 |
+
"suffix": "",
|
| 20 |
+
"url": "-_0_0_0/before_recompile_pre_grad_2.txt"
|
| 21 |
+
},
|
| 22 |
+
{
|
| 23 |
+
"name": "after_recompile_pre_grad_3.txt",
|
| 24 |
+
"number": 3,
|
| 25 |
+
"suffix": "",
|
| 26 |
+
"url": "-_0_0_0/after_recompile_pre_grad_3.txt"
|
| 27 |
+
},
|
| 28 |
+
{
|
| 29 |
+
"name": "aot_forward_graph_fw_metadata_4.txt",
|
| 30 |
+
"number": 4,
|
| 31 |
+
"suffix": "",
|
| 32 |
+
"url": "-_0_0_0/aot_forward_graph_fw_metadata_4.txt"
|
| 33 |
+
},
|
| 34 |
+
{
|
| 35 |
+
"name": "aot_inference_graph_5.txt",
|
| 36 |
+
"number": 5,
|
| 37 |
+
"suffix": "",
|
| 38 |
+
"url": "-_0_0_0/aot_inference_graph_5.txt"
|
| 39 |
+
},
|
| 40 |
+
{
|
| 41 |
+
"name": "torch._functorch.config_6.txt",
|
| 42 |
+
"number": 6,
|
| 43 |
+
"suffix": "",
|
| 44 |
+
"url": "-_0_0_0/torch._functorch.config_6.txt"
|
| 45 |
+
},
|
| 46 |
+
{
|
| 47 |
+
"name": "inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html",
|
| 48 |
+
"number": 7,
|
| 49 |
+
"suffix": "",
|
| 50 |
+
"url": "-_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html"
|
| 51 |
+
},
|
| 52 |
+
{
|
| 53 |
+
"name": "fx_graph_cache_hit_8.json",
|
| 54 |
+
"number": 8,
|
| 55 |
+
"suffix": "✅",
|
| 56 |
+
"url": "-_0_0_0/fx_graph_cache_hit_8.json"
|
| 57 |
+
},
|
| 58 |
+
{
|
| 59 |
+
"name": "aotautograd_cache_bypass_9.json",
|
| 60 |
+
"number": 9,
|
| 61 |
+
"suffix": "❓",
|
| 62 |
+
"url": "-_0_0_0/aotautograd_cache_bypass_9.json"
|
| 63 |
+
},
|
| 64 |
+
{
|
| 65 |
+
"name": "dynamo_cpp_guards_str_10.txt",
|
| 66 |
+
"number": 10,
|
| 67 |
+
"suffix": "",
|
| 68 |
+
"url": "-_0_0_0/dynamo_cpp_guards_str_10.txt"
|
| 69 |
+
},
|
| 70 |
+
{
|
| 71 |
+
"name": "compilation_metrics_11.html",
|
| 72 |
+
"number": 11,
|
| 73 |
+
"suffix": "",
|
| 74 |
+
"url": "-_0_0_0/compilation_metrics_11.html"
|
| 75 |
+
}
|
| 76 |
+
]
|
| 77 |
+
}
|
| 78 |
+
}
|
failures_and_restarts.html
ADDED
|
@@ -0,0 +1,72 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
<html>
|
| 3 |
+
<head>
|
| 4 |
+
<style>
|
| 5 |
+
|
| 6 |
+
table {
|
| 7 |
+
width: 90%;
|
| 8 |
+
border-collapse: collapse;
|
| 9 |
+
margin: 20px 0;
|
| 10 |
+
}
|
| 11 |
+
table, th, td {
|
| 12 |
+
border: 1px solid #999;
|
| 13 |
+
padding: 10px;
|
| 14 |
+
text-align: left;
|
| 15 |
+
}
|
| 16 |
+
th {
|
| 17 |
+
background-color: #d3d3d3;
|
| 18 |
+
font-weight: bold;
|
| 19 |
+
}
|
| 20 |
+
tr:nth-child(odd) {
|
| 21 |
+
background-color: #f2f2f2;
|
| 22 |
+
}
|
| 23 |
+
a {
|
| 24 |
+
color: #0066cc;
|
| 25 |
+
text-decoration: none;
|
| 26 |
+
}
|
| 27 |
+
a:hover {
|
| 28 |
+
text-decoration: underline;
|
| 29 |
+
}
|
| 30 |
+
|
| 31 |
+
</style>
|
| 32 |
+
</head>
|
| 33 |
+
<body>
|
| 34 |
+
<h1>Failures and Restarts</h1>
|
| 35 |
+
<table>
|
| 36 |
+
<tr> <th> Compile Id </th> <th> Failure Type </th> <th> Failure Description </th> <th> Failure Source (compilation failures only) </th> </tr>
|
| 37 |
+
|
| 38 |
+
|
| 39 |
+
<script>
|
| 40 |
+
document.addEventListener('DOMContentLoaded', function() {
|
| 41 |
+
|
| 42 |
+
// Append the current URL's query parameters to all relative links on the page
|
| 43 |
+
const queryParams = new URLSearchParams(window.location.search);
|
| 44 |
+
if (queryParams.size === 0) return url; // No query params, return original URL
|
| 45 |
+
|
| 46 |
+
function appendQueryParams(url) {
|
| 47 |
+
const newURL = new URL((new Request(url)).url); // new URL(<relative URL>) but it actually works
|
| 48 |
+
const newSearchParams = new URLSearchParams(newURL.searchParams);
|
| 49 |
+
console.log(newURL.searchParams);
|
| 50 |
+
console.log(newSearchParams);
|
| 51 |
+
|
| 52 |
+
// Append query parameters
|
| 53 |
+
for (const [key, value] of queryParams) {
|
| 54 |
+
newSearchParams.set(key, value);
|
| 55 |
+
}
|
| 56 |
+
|
| 57 |
+
newURL.search = newSearchParams;
|
| 58 |
+
return newURL;
|
| 59 |
+
}
|
| 60 |
+
|
| 61 |
+
// Select all relative links on the page
|
| 62 |
+
const relativeLinks = document.querySelectorAll('a[href]:not([href^="http://"]):not([href^="https://"]):not([href^="\#"])');
|
| 63 |
+
|
| 64 |
+
// Append query parameters to each relative link
|
| 65 |
+
relativeLinks.forEach((link) => {
|
| 66 |
+
link.setAttribute("href", appendQueryParams(link.getAttribute("href")))
|
| 67 |
+
});
|
| 68 |
+
});
|
| 69 |
+
</script>
|
| 70 |
+
|
| 71 |
+
</body>
|
| 72 |
+
</html>
|
index.html
ADDED
|
@@ -0,0 +1,202 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
| 2 |
+
<html>
|
| 3 |
+
<head>
|
| 4 |
+
<meta charset="UTF-8">
|
| 5 |
+
</head>
|
| 6 |
+
<style>
|
| 7 |
+
|
| 8 |
+
table td { vertical-align: top; }
|
| 9 |
+
|
| 10 |
+
.stack-trie { white-space: nowrap; font-family: monospace; }
|
| 11 |
+
.stack-trie ul { padding-left: 1ch; }
|
| 12 |
+
.stack-trie li { margin-left: 1ch; list-style-type: none; }
|
| 13 |
+
.stack-trie .marker {
|
| 14 |
+
cursor: pointer;
|
| 15 |
+
}
|
| 16 |
+
.stack-trie .marker.collapsed::before {
|
| 17 |
+
content: "+ ";
|
| 18 |
+
}
|
| 19 |
+
.stack-trie .marker:not(.collapsed)::before {
|
| 20 |
+
content: "- ";
|
| 21 |
+
}
|
| 22 |
+
.stack-trie a { text-decoration: none; }
|
| 23 |
+
.stack-trie a:hover { text-decoration: underline; }
|
| 24 |
+
.status-missing { background-color: purple; color: white; }
|
| 25 |
+
.status-error { background-color: red; color: white; }
|
| 26 |
+
.status-empty { background-color: white; color: black; }
|
| 27 |
+
.status-ok { background-color: green; color: white; }
|
| 28 |
+
.status-break { background-color: lime; color: black; }
|
| 29 |
+
summary::-webkit-details-marker { color: #00ACF3; font-size: 125%; margin-right: 2px; }
|
| 30 |
+
summary:focus { outline-style: none; }
|
| 31 |
+
article > details > summary { font-size: 28px; margin-top: 16px; }
|
| 32 |
+
details > p { margin-left: 24px; }
|
| 33 |
+
details details summary { font-size: 16px; }
|
| 34 |
+
|
| 35 |
+
</style>
|
| 36 |
+
<script>
|
| 37 |
+
|
| 38 |
+
function toggleList(toggleItem) {
|
| 39 |
+
const listItem = toggleItem.parentNode;
|
| 40 |
+
const nestedList = listItem.querySelector('ul');
|
| 41 |
+
if (nestedList) {
|
| 42 |
+
nestedList.style.display = nestedList.style.display === 'none' ? 'block' : 'none';
|
| 43 |
+
|
| 44 |
+
// Toggle the collapse/expand indicator
|
| 45 |
+
toggleItem.classList.toggle('collapsed');
|
| 46 |
+
}
|
| 47 |
+
}
|
| 48 |
+
|
| 49 |
+
</script>
|
| 50 |
+
<body>
|
| 51 |
+
<div>
|
| 52 |
+
|
| 53 |
+
<h2>Stack trie</h2>
|
| 54 |
+
<p>
|
| 55 |
+
The <strong>stack trie</strong> is a way of getting a quick orientation on where all the
|
| 56 |
+
compilations in a model take place, especially if you are compiling a codebase you are unfamiliar with.
|
| 57 |
+
It is a tree of stack frames, for all stacks that triggered PT2 compilation. If only a single
|
| 58 |
+
stack is in the tree, you will simply see a plain list of frames (most recent call last). With
|
| 59 |
+
multiple stacks, at every point where two stacks diverge from having a common prefix, we increase
|
| 60 |
+
the indentation of the list and have a separate sub-list per sub-tree.
|
| 61 |
+
</p>
|
| 62 |
+
<p>
|
| 63 |
+
Links to a particular compilation are color-coded by status:
|
| 64 |
+
<span class="status-ok">[Success]</span>,
|
| 65 |
+
<span class="status-break">[Success with restart (e.g., graph break)]</span>,
|
| 66 |
+
<span class="status-empty">[Empty graph]</span>,
|
| 67 |
+
<span class="status-error">[Error]</span>,
|
| 68 |
+
<span class="status-missing">[Metrics were missing]</span>
|
| 69 |
+
</p>
|
| 70 |
+
<details><summary>Stack</summary><div class='stack-trie'><ul><li>/shared_volume/repos/quark/bench_qdq.py:161 in <module><br> mean, median = do_bench(run_scaled_fake_quantize_comp, kwargs_scaled_fake_quantize, num_runs=num_runs, num_warmup=num_warmup, name="quark qdq")</li>
|
| 71 |
+
<li>/shared_volume/repos/quark/bench_qdq.py:70 in do_bench<br> f(**kwargs)</li>
|
| 72 |
+
<li><a href='#[0/0]' class='status-ok'>[0/0]</a> /shared_volume/repos/quark/bench_qdq.py:7 in run_scaled_fake_quantize<br> </li>
|
| 73 |
+
</ul></div></details>
|
| 74 |
+
</div>
|
| 75 |
+
<div>
|
| 76 |
+
|
| 77 |
+
<h2>IR dumps</h2>
|
| 78 |
+
<p>
|
| 79 |
+
The <strong>IR dumps</strong> are intermediate products collected from various points of the PT2
|
| 80 |
+
compilation process. The products are organized by compile id, and then sorted in chronological
|
| 81 |
+
order.
|
| 82 |
+
</p>
|
| 83 |
+
<p>
|
| 84 |
+
A <strong>compile id</strong> uniquely identifies a particular compilation inside a PT2
|
| 85 |
+
program. It is traditionally written as <code>[x/y]</code>, where the <strong>frame id</strong> x
|
| 86 |
+
identifies the particular Python frame which we are compiling, and <strong>frame compile
|
| 87 |
+
id</strong> y identifies how many times we've recompiled this same frame. For example,
|
| 88 |
+
<code>[0/0]</code> refers to the very first frame compiled by PT2; <code>[0/1]</code> refers to the
|
| 89 |
+
first recompilation of this frame, while <code>[1/0]</code> refers to a different frame, within
|
| 90 |
+
a distinct code cache, which we are compiling next (perhaps because of a graph break). Although
|
| 91 |
+
Dynamo treats distinct frames as completely unrelated, a frame compilation could overlap with another
|
| 92 |
+
frame; for example, if you graph break in an inlined function, Dynamo will typically try to compile
|
| 93 |
+
the nested frame again on an inner frame. You can identify the hierarchical relationship between
|
| 94 |
+
frames by looking at the stack trie above.
|
| 95 |
+
</p>
|
| 96 |
+
<p>
|
| 97 |
+
In some situations, the compile id will have an extra signifier <code>[x/y_z]</code>, where z is the
|
| 98 |
+
<strong>attempt</strong> for this particular (re)compilation. Certain conditions will cause Dynamo to
|
| 99 |
+
restart analysis, when Dynamo discovers that it needs to undo a decision it previously made. The most
|
| 100 |
+
common cause of recompilation is a graph break in an inlined function call, which forces Dynamo to restart
|
| 101 |
+
and avoid inlining the function in the first place.
|
| 102 |
+
</p>
|
| 103 |
+
<p>
|
| 104 |
+
When compiled autograd is enabled, the compile id will include a prefix signifier <code>[!a/x/y]</code>,
|
| 105 |
+
where a is the <strong>compiled autograd id</strong>. For instance, <code>[!0/-/-]</code> refers
|
| 106 |
+
to the first graph captured by compiled autograd. It is then traced by torch.compile as <code>[!0/x/y_z]</code>.
|
| 107 |
+
</p>
|
| 108 |
+
<p>
|
| 109 |
+
Here is a high level description of PT2's compilation phases, and the intermediate products each
|
| 110 |
+
phase generates:
|
| 111 |
+
</p>
|
| 112 |
+
<ol>
|
| 113 |
+
<li><em>Optional:</em> If compiled autograd is enabled, and we are processing a backward call, compiled autograd will trace the autograd graph from the autograd engine, and produce an FX graph <code>compiled_autograd_graph</code> that will be Dynamo traced. Otherwise, Dynamo will directly trace user's bytecode.</li>
|
| 114 |
+
<li>Dynamo symbolically evaluates the Python bytecode of a program, producing <code>dynamo_output_graph</code></li>
|
| 115 |
+
<li><em>Optional:</em> If <code>optimize_ddp</code> is enabled, the DDPOptimizer will split the Dynamo output graph to improve pipelining communications. Each split subgraph is <code>optimize_ddp_split_child_submod</code>, and the high level graph that plumbs the graphs together is <code>optimize_ddp_split_graph</code>. If there are multiple splits, each subsequent build product will be produced multiple times, one for each split.</li>
|
| 116 |
+
<li>AOTAutograd traces the (possibly split) Dynamo output graph, producing an <code>aot_joint_graph</code> if backwards is enabled. It then partitions the graph into <code>aot_forward_graph</code> and <code>aot_backward_graph</code>. If training is not needed, there may only be an <code>aot_inference_graph</code>.</li>
|
| 117 |
+
<li>Inductor will apply some post grad FX passes, producing <code>inductor_post_grad_graph</code></li>
|
| 118 |
+
<li>Inductor will perform code generation, producing the final <code>inductor_output_code</code> which will be executed at runtime. This output is a valid Python program and can be directly run.</li>
|
| 119 |
+
</ol>
|
| 120 |
+
|
| 121 |
+
|
| 122 |
+
<h2> Chromium Events </h2>
|
| 123 |
+
PT2 generates <a href='chromium_events.json'>Chromium Trace Events</a> in JSON on specific events during compilation.
|
| 124 |
+
You can download and view them in a tool like <a href='https://ui.perfetto.dev/'>Perfetto</a>.
|
| 125 |
+
|
| 126 |
+
<p>
|
| 127 |
+
Build products below:
|
| 128 |
+
</p>
|
| 129 |
+
<ul>
|
| 130 |
+
|
| 131 |
+
<li><a id="[0/0]">[0/0]</a>
|
| 132 |
+
<ul>
|
| 133 |
+
|
| 134 |
+
<li><a href="-_0_0_0/dynamo_output_graph_0.txt">-_0_0_0/dynamo_output_graph_0.txt</a> (0)</li>
|
| 135 |
+
|
| 136 |
+
<li><a href="-_0_0_0/inductor_pre_grad_graph_1.txt">-_0_0_0/inductor_pre_grad_graph_1.txt</a> (1)</li>
|
| 137 |
+
|
| 138 |
+
<li><a href="-_0_0_0/before_recompile_pre_grad_2.txt">-_0_0_0/before_recompile_pre_grad_2.txt</a> (2)</li>
|
| 139 |
+
|
| 140 |
+
<li><a href="-_0_0_0/after_recompile_pre_grad_3.txt">-_0_0_0/after_recompile_pre_grad_3.txt</a> (3)</li>
|
| 141 |
+
|
| 142 |
+
<li><a href="-_0_0_0/aot_forward_graph_fw_metadata_4.txt">-_0_0_0/aot_forward_graph_fw_metadata_4.txt</a> (4)</li>
|
| 143 |
+
|
| 144 |
+
<li><a href="-_0_0_0/aot_inference_graph_5.txt">-_0_0_0/aot_inference_graph_5.txt</a> (5)</li>
|
| 145 |
+
|
| 146 |
+
<li><a href="-_0_0_0/torch._functorch.config_6.txt">-_0_0_0/torch._functorch.config_6.txt</a> (6)</li>
|
| 147 |
+
|
| 148 |
+
<li><a href="-_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html">-_0_0_0/inductor_output_code_ch44xxkifazlcpkp6mi44xhqeej2j5mbgwmesiwx6y3oajzmixxp_7.html</a> (7)</li>
|
| 149 |
+
|
| 150 |
+
<li><a href="-_0_0_0/fx_graph_cache_hit_8.json">-_0_0_0/fx_graph_cache_hit_8.json</a> ✅ (8)</li>
|
| 151 |
+
|
| 152 |
+
<li><a href="-_0_0_0/aotautograd_cache_bypass_9.json">-_0_0_0/aotautograd_cache_bypass_9.json</a> ❓ (9)</li>
|
| 153 |
+
|
| 154 |
+
<li><a href="-_0_0_0/dynamo_cpp_guards_str_10.txt">-_0_0_0/dynamo_cpp_guards_str_10.txt</a> (10)</li>
|
| 155 |
+
|
| 156 |
+
<li><a href="-_0_0_0/compilation_metrics_11.html">-_0_0_0/compilation_metrics_11.html</a> (11)</li>
|
| 157 |
+
|
| 158 |
+
</ul>
|
| 159 |
+
</li>
|
| 160 |
+
|
| 161 |
+
</ul>
|
| 162 |
+
</div>
|
| 163 |
+
|
| 164 |
+
|
| 165 |
+
|
| 166 |
+
|
| 167 |
+
|
| 168 |
+
|
| 169 |
+
<script>
|
| 170 |
+
document.addEventListener('DOMContentLoaded', function() {
|
| 171 |
+
|
| 172 |
+
// Append the current URL's query parameters to all relative links on the page
|
| 173 |
+
const queryParams = new URLSearchParams(window.location.search);
|
| 174 |
+
if (queryParams.size === 0) return url; // No query params, return original URL
|
| 175 |
+
|
| 176 |
+
function appendQueryParams(url) {
|
| 177 |
+
const newURL = new URL((new Request(url)).url); // new URL(<relative URL>) but it actually works
|
| 178 |
+
const newSearchParams = new URLSearchParams(newURL.searchParams);
|
| 179 |
+
console.log(newURL.searchParams);
|
| 180 |
+
console.log(newSearchParams);
|
| 181 |
+
|
| 182 |
+
// Append query parameters
|
| 183 |
+
for (const [key, value] of queryParams) {
|
| 184 |
+
newSearchParams.set(key, value);
|
| 185 |
+
}
|
| 186 |
+
|
| 187 |
+
newURL.search = newSearchParams;
|
| 188 |
+
return newURL;
|
| 189 |
+
}
|
| 190 |
+
|
| 191 |
+
// Select all relative links on the page
|
| 192 |
+
const relativeLinks = document.querySelectorAll('a[href]:not([href^="http://"]):not([href^="https://"]):not([href^="\#"])');
|
| 193 |
+
|
| 194 |
+
// Append query parameters to each relative link
|
| 195 |
+
relativeLinks.forEach((link) => {
|
| 196 |
+
link.setAttribute("href", appendQueryParams(link.getAttribute("href")))
|
| 197 |
+
});
|
| 198 |
+
});
|
| 199 |
+
</script>
|
| 200 |
+
|
| 201 |
+
</body>
|
| 202 |
+
</html>
|
raw.log
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|