Update README.md
Browse files
README.md
CHANGED
|
@@ -35,17 +35,17 @@ The species list is derived from the Collins bird guide [^1].
|
|
| 35 |
import birder
|
| 36 |
from birder.inference.classification import infer_image
|
| 37 |
|
| 38 |
-
(net,
|
| 39 |
|
| 40 |
# Get the image size the model was trained on
|
| 41 |
-
size = birder.get_size_from_signature(signature)
|
| 42 |
|
| 43 |
# Create an inference transform
|
| 44 |
-
transform = birder.classification_transform(size, rgb_stats)
|
| 45 |
|
| 46 |
image = "path/to/image.jpeg" # or a PIL image, must be loaded in RGB format
|
| 47 |
(out, _) = infer_image(net, image, transform)
|
| 48 |
-
# out is a NumPy array with shape of (1,
|
| 49 |
```
|
| 50 |
|
| 51 |
### Image Embeddings
|
|
@@ -54,17 +54,17 @@ image = "path/to/image.jpeg" # or a PIL image, must be loaded in RGB format
|
|
| 54 |
import birder
|
| 55 |
from birder.inference.classification import infer_image
|
| 56 |
|
| 57 |
-
(net,
|
| 58 |
|
| 59 |
# Get the image size the model was trained on
|
| 60 |
-
size = birder.get_size_from_signature(signature)
|
| 61 |
|
| 62 |
# Create an inference transform
|
| 63 |
-
transform = birder.classification_transform(size, rgb_stats)
|
| 64 |
|
| 65 |
image = "path/to/image.jpeg" # or a PIL image
|
| 66 |
(out, embedding) = infer_image(net, image, transform, return_embedding=True)
|
| 67 |
-
# embedding is a NumPy array with shape of (1,
|
| 68 |
```
|
| 69 |
|
| 70 |
### Detection Feature Map
|
|
@@ -73,13 +73,13 @@ image = "path/to/image.jpeg" # or a PIL image
|
|
| 73 |
from PIL import Image
|
| 74 |
import birder
|
| 75 |
|
| 76 |
-
(net,
|
| 77 |
|
| 78 |
# Get the image size the model was trained on
|
| 79 |
-
size = birder.get_size_from_signature(signature)
|
| 80 |
|
| 81 |
# Create an inference transform
|
| 82 |
-
transform = birder.classification_transform(size, rgb_stats)
|
| 83 |
|
| 84 |
image = Image.open("path/to/image.jpeg")
|
| 85 |
features = net.detection_features(transform(image).unsqueeze(0))
|
|
@@ -96,12 +96,12 @@ print([(k, v.size()) for k, v in features.items()])
|
|
| 96 |
|
| 97 |
```bibtex
|
| 98 |
@misc{woo2023convnextv2codesigningscaling,
|
| 99 |
-
title={ConvNeXt V2: Co-designing and Scaling ConvNets with Masked Autoencoders},
|
| 100 |
author={Sanghyun Woo and Shoubhik Debnath and Ronghang Hu and Xinlei Chen and Zhuang Liu and In So Kweon and Saining Xie},
|
| 101 |
year={2023},
|
| 102 |
eprint={2301.00808},
|
| 103 |
archivePrefix={arXiv},
|
| 104 |
primaryClass={cs.CV},
|
| 105 |
-
url={https://arxiv.org/abs/2301.00808},
|
| 106 |
}
|
| 107 |
```
|
|
|
|
| 35 |
import birder
|
| 36 |
from birder.inference.classification import infer_image
|
| 37 |
|
| 38 |
+
(net, model_info) = birder.load_pretrained_model("convnext_v2_tiny_intermediate-eu-common", inference=True)
|
| 39 |
|
| 40 |
# Get the image size the model was trained on
|
| 41 |
+
size = birder.get_size_from_signature(model_info.signature)
|
| 42 |
|
| 43 |
# Create an inference transform
|
| 44 |
+
transform = birder.classification_transform(size, model_info.rgb_stats)
|
| 45 |
|
| 46 |
image = "path/to/image.jpeg" # or a PIL image, must be loaded in RGB format
|
| 47 |
(out, _) = infer_image(net, image, transform)
|
| 48 |
+
# out is a NumPy array with shape of (1, 707), representing class probabilities.
|
| 49 |
```
|
| 50 |
|
| 51 |
### Image Embeddings
|
|
|
|
| 54 |
import birder
|
| 55 |
from birder.inference.classification import infer_image
|
| 56 |
|
| 57 |
+
(net, model_info) = birder.load_pretrained_model("convnext_v2_tiny_intermediate-eu-common", inference=True)
|
| 58 |
|
| 59 |
# Get the image size the model was trained on
|
| 60 |
+
size = birder.get_size_from_signature(model_info.signature)
|
| 61 |
|
| 62 |
# Create an inference transform
|
| 63 |
+
transform = birder.classification_transform(size, model_info.rgb_stats)
|
| 64 |
|
| 65 |
image = "path/to/image.jpeg" # or a PIL image
|
| 66 |
(out, embedding) = infer_image(net, image, transform, return_embedding=True)
|
| 67 |
+
# embedding is a NumPy array with shape of (1, 768)
|
| 68 |
```
|
| 69 |
|
| 70 |
### Detection Feature Map
|
|
|
|
| 73 |
from PIL import Image
|
| 74 |
import birder
|
| 75 |
|
| 76 |
+
(net, model_info) = birder.load_pretrained_model("convnext_v2_tiny_intermediate-eu-common", inference=True)
|
| 77 |
|
| 78 |
# Get the image size the model was trained on
|
| 79 |
+
size = birder.get_size_from_signature(model_info.signature)
|
| 80 |
|
| 81 |
# Create an inference transform
|
| 82 |
+
transform = birder.classification_transform(size, model_info.rgb_stats)
|
| 83 |
|
| 84 |
image = Image.open("path/to/image.jpeg")
|
| 85 |
features = net.detection_features(transform(image).unsqueeze(0))
|
|
|
|
| 96 |
|
| 97 |
```bibtex
|
| 98 |
@misc{woo2023convnextv2codesigningscaling,
|
| 99 |
+
title={ConvNeXt V2: Co-designing and Scaling ConvNets with Masked Autoencoders},
|
| 100 |
author={Sanghyun Woo and Shoubhik Debnath and Ronghang Hu and Xinlei Chen and Zhuang Liu and In So Kweon and Saining Xie},
|
| 101 |
year={2023},
|
| 102 |
eprint={2301.00808},
|
| 103 |
archivePrefix={arXiv},
|
| 104 |
primaryClass={cs.CV},
|
| 105 |
+
url={https://arxiv.org/abs/2301.00808},
|
| 106 |
}
|
| 107 |
```
|