Upload quantized model and evaluation results
Browse files- README.md +16 -0
- __pycache__/model.cpython-310.pyc +0 -0
- eval_results.json +1 -0
- liteml_config.yaml +18 -0
- metadata.yaml +8 -0
- model.py +7 -0
- quantized_model.pth +3 -0
README.md
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
# 🧠 Model: Alexnet
|
| 2 |
+
|
| 3 |
+
This is a quantized version of `Alexnet` using `W8A8 static` quantization.
|
| 4 |
+
|
| 5 |
+
## 🧪 Evaluation Summary
|
| 6 |
+
|
| 7 |
+
| Metric | FP32 | Quantized |
|
| 8 |
+
|----------------|------------------|------------|
|
| 9 |
+
| Top-1 Accuracy | 0.555 | 0.5357142686843872 |
|
| 10 |
+
| Top-5 Accuracy | 0.777 | 0.788690447807312 |
|
| 11 |
+
|
| 12 |
+
- Dataset: `ImageNet`
|
| 13 |
+
- Evaluation Date: `2025-07-18`
|
| 14 |
+
|
| 15 |
+
## 🔍 Notes
|
| 16 |
+
Quantized W8A8 Resnet50 model from torchvision
|
__pycache__/model.cpython-310.pyc
ADDED
|
Binary file (397 Bytes). View file
|
|
|
eval_results.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"top1": 0.5357142686843872, "top5": 0.788690447807312}
|
liteml_config.yaml
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
QAT:
|
| 2 |
+
device: "cuda"
|
| 3 |
+
fully_quantized: True
|
| 4 |
+
data_quantization:
|
| 5 |
+
status: On
|
| 6 |
+
bits: 8
|
| 7 |
+
custom_bits: {}
|
| 8 |
+
symmetric: On
|
| 9 |
+
quantization_mode: static
|
| 10 |
+
observer: "MovingAverage"
|
| 11 |
+
per_channel: False
|
| 12 |
+
|
| 13 |
+
weights_quantization:
|
| 14 |
+
status: On
|
| 15 |
+
bits: 8
|
| 16 |
+
custom_bits: {}
|
| 17 |
+
symmetric: On
|
| 18 |
+
per_channel: False
|
metadata.yaml
ADDED
|
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
model_name: Alexnet
|
| 2 |
+
liteml_config: 'liteml_config.yaml'
|
| 3 |
+
quantization_type: W8A8 static
|
| 4 |
+
dataset: ImageNet
|
| 5 |
+
notes: Quantized W8A8 Resnet50 model from torchvision
|
| 6 |
+
# TODO: move float accuracy somewhere else
|
| 7 |
+
top1_float: 0.555
|
| 8 |
+
top5_float: 0.777
|
model.py
ADDED
|
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import torch
|
| 2 |
+
device = "cuda" if torch.cuda.is_available() else "cpu"
|
| 3 |
+
|
| 4 |
+
|
| 5 |
+
def get_model():
|
| 6 |
+
from torchvision.models import alexnet
|
| 7 |
+
return alexnet(weights='IMAGENET1K_V1').to(device)
|
quantized_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9acca062fc682969c778761026f0a92bebf373c3629f86db9e501ce3925ea8d0
|
| 3 |
+
size 244448061
|