Spaces:
Running
Running
Update index.html
Browse files- index.html +18 -9
index.html
CHANGED
|
@@ -120,6 +120,9 @@
|
|
| 120 |
const attentionBq = includeBias ? hiddenSize : 0;
|
| 121 |
const attentionBk = includeBias ? numKeyValueHeads : 0;
|
| 122 |
const attentionBv = includeBias ? numKeyValueHeads : 0;
|
|
|
|
|
|
|
|
|
|
| 123 |
const attentionTotal = 2 * (attentionQ + attentionBq) + 2 * (attentionK + attentionBk) + 2 * (attentionV + attentionBv);
|
| 124 |
|
| 125 |
// Feed Forward calculations
|
|
@@ -145,23 +148,27 @@
|
|
| 145 |
|
| 146 |
// Display results
|
| 147 |
const attentionTable = document.getElementById('attention_table');
|
| 148 |
-
attentionTable.innerHTML = `
|
| 149 |
-
<tr><th>Type</th><th>
|
| 150 |
-
<tr><td>
|
|
|
|
|
|
|
| 151 |
${includeBias ? `<tr class="bias-row"><td>Bias</td><td>${attentionBq.toLocaleString()}</td><td>${attentionBk.toLocaleString()}</td><td>${attentionBv.toLocaleString()}</td><td></td></tr>` : ''}
|
| 152 |
`;
|
| 153 |
|
| 154 |
const feedForwardTable = document.getElementById('feed_forward_table');
|
| 155 |
feedForwardTable.innerHTML = `
|
| 156 |
-
<tr><th>Type</th><th>
|
| 157 |
-
<tr><td>
|
|
|
|
|
|
|
| 158 |
${includeBias ? `<tr class="bias-row"><td>Bias</td><td>${switchB.toLocaleString()}</td><td>${luB.toLocaleString()}</td><td>${projB.toLocaleString()}</td><td></td></tr>` : ''}
|
| 159 |
`;
|
| 160 |
|
| 161 |
const embeddingTable = document.getElementById('embedding_table');
|
| 162 |
embeddingTable.innerHTML = `
|
| 163 |
-
<tr><th>Type</th><th>Total</th></tr>
|
| 164 |
-
<tr><td>Embedding</td><td>${embeddingTotal.toLocaleString()}</td></tr>
|
| 165 |
`;
|
| 166 |
|
| 167 |
document.getElementById('one_layer_params').innerText = oneLayerParams.toLocaleString();
|
|
@@ -204,6 +211,10 @@
|
|
| 204 |
<div class="output">
|
| 205 |
<h3>Model Parameter Results</h3>
|
| 206 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 207 |
<div class="section-title">Attention Parameters</div>
|
| 208 |
<table id="attention_table" class="sub-table"></table>
|
| 209 |
|
|
@@ -214,8 +225,6 @@
|
|
| 214 |
<table id="embedding_table" class="sub-table"></table>
|
| 215 |
|
| 216 |
<div class="highlight">
|
| 217 |
-
<strong>1 Layer Parameters:</strong> <span id="one_layer_params">0</span><br>
|
| 218 |
-
<strong>Full Layers Parameters:</strong> <span id="full_layers_params">0</span><br>
|
| 219 |
<strong>Complete Model Size:</strong> <span id="full_size">0</span>
|
| 220 |
</div>
|
| 221 |
</div>
|
|
|
|
| 120 |
const attentionBq = includeBias ? hiddenSize : 0;
|
| 121 |
const attentionBk = includeBias ? numKeyValueHeads : 0;
|
| 122 |
const attentionBv = includeBias ? numKeyValueHeads : 0;
|
| 123 |
+
const attentionQOutput = hiddenSize;
|
| 124 |
+
const attentionKOutput = numKeyValueHeads;
|
| 125 |
+
const attentionVOutput = numKeyValueHeads;
|
| 126 |
const attentionTotal = 2 * (attentionQ + attentionBq) + 2 * (attentionK + attentionBk) + 2 * (attentionV + attentionBv);
|
| 127 |
|
| 128 |
// Feed Forward calculations
|
|
|
|
| 148 |
|
| 149 |
// Display results
|
| 150 |
const attentionTable = document.getElementById('attention_table');
|
| 151 |
+
attentionTable.innerHTML = `
|
| 152 |
+
<tr><th>Type</th><th>Input Size</th><th>Output Size</th><th>Total Size</th></tr>
|
| 153 |
+
<tr><td>Q</td><td>${hiddenSize.toLocaleString()}</td><td>${attentionQOutput.toLocaleString()}</td><td>${(hiddenSize * attentionQOutput).toLocaleString()}</td></tr>
|
| 154 |
+
<tr><td>K</td><td>${hiddenSize.toLocaleString()}</td><td>${attentionKOutput.toLocaleString()}</td><td>${(hiddenSize * attentionKOutput).toLocaleString()}</td></tr>
|
| 155 |
+
<tr><td>V</td><td>${hiddenSize.toLocaleString()}</td><td>${attentionVOutput.toLocaleString()}</td><td>${(hiddenSize * attentionVOutput).toLocaleString()}</td></tr>
|
| 156 |
${includeBias ? `<tr class="bias-row"><td>Bias</td><td>${attentionBq.toLocaleString()}</td><td>${attentionBk.toLocaleString()}</td><td>${attentionBv.toLocaleString()}</td><td></td></tr>` : ''}
|
| 157 |
`;
|
| 158 |
|
| 159 |
const feedForwardTable = document.getElementById('feed_forward_table');
|
| 160 |
feedForwardTable.innerHTML = `
|
| 161 |
+
<tr><th>Type</th><th>Input Size</th><th>Output Size</th><th>Total Size</th></tr>
|
| 162 |
+
<tr><td>Switch W</td><td>${hiddenSize.toLocaleString()}</td><td>${intermediateSize.toLocaleString()}</td><td>${(hiddenSize * intermediateSize).toLocaleString()}</td></tr>
|
| 163 |
+
<tr><td>LU W</td><td>${hiddenSize.toLocaleString()}</td><td>${intermediateSize.toLocaleString()}</td><td>${(hiddenSize * intermediateSize).toLocaleString()}</td></tr>
|
| 164 |
+
<tr><td>Proj W</td><td>${intermediateSize.toLocaleString()}</td><td>${hiddenSize.toLocaleString()}</td><td>${(intermediateSize * hiddenSize).toLocaleString()}</td></tr>
|
| 165 |
${includeBias ? `<tr class="bias-row"><td>Bias</td><td>${switchB.toLocaleString()}</td><td>${luB.toLocaleString()}</td><td>${projB.toLocaleString()}</td><td></td></tr>` : ''}
|
| 166 |
`;
|
| 167 |
|
| 168 |
const embeddingTable = document.getElementById('embedding_table');
|
| 169 |
embeddingTable.innerHTML = `
|
| 170 |
+
<tr><th>Type</th><th>Input Size</th><th>Output Size</th><th>Total Size</th></tr>
|
| 171 |
+
<tr><td>Embedding</td><td>${vocabSize.toLocaleString()}</td><td>${hiddenSize.toLocaleString()}</td><td>${embeddingTotal.toLocaleString()}</td></tr>
|
| 172 |
`;
|
| 173 |
|
| 174 |
document.getElementById('one_layer_params').innerText = oneLayerParams.toLocaleString();
|
|
|
|
| 211 |
<div class="output">
|
| 212 |
<h3>Model Parameter Results</h3>
|
| 213 |
|
| 214 |
+
<div class="section-title">1 Layer Parameters</div>
|
| 215 |
+
<div><strong>1 Layer Parameters:</strong> <span id="one_layer_params">0</span></div>
|
| 216 |
+
<div><strong>Full Layers Parameters:</strong> <span id="full_layers_params">0</span></div>
|
| 217 |
+
|
| 218 |
<div class="section-title">Attention Parameters</div>
|
| 219 |
<table id="attention_table" class="sub-table"></table>
|
| 220 |
|
|
|
|
| 225 |
<table id="embedding_table" class="sub-table"></table>
|
| 226 |
|
| 227 |
<div class="highlight">
|
|
|
|
|
|
|
| 228 |
<strong>Complete Model Size:</strong> <span id="full_size">0</span>
|
| 229 |
</div>
|
| 230 |
</div>
|