qubvel-hf committed
Commit 41c9420 · verified · 1 Parent(s): 5b65126

Upload folder using huggingface_hub

Files changed (4)
  1. README.md +97 -0
  2. albumentations_config_eval.json +1 -0
  3. config.json +19 -0
  4. model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,97 @@
---
library_name: segmentation-models-pytorch
license: mit
pipeline_tag: image-segmentation
tags:
- model_hub_mixin
- pytorch_model_hub_mixin
- segmentation-models-pytorch
- semantic-segmentation
- pytorch
- dpt
languages:
- python
---
# DPT Model Card

Table of Contents:
- [Load trained model](#load-trained-model)
- [Model init parameters](#model-init-parameters)
- [Dataset](#dataset)

## Load trained model

[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/qubvel/segmentation_models.pytorch/blob/main/examples/dpt_inference_pretrained.ipynb)

1. Install requirements.

```bash
pip install -U segmentation_models_pytorch albumentations
```

2. Run inference.

```python
import torch
import requests
import numpy as np
import albumentations as A
import segmentation_models_pytorch as smp

from PIL import Image

device = "cuda" if torch.cuda.is_available() else "cpu"

# Load pretrained model and preprocessing function
checkpoint = "smp-hub/dpt-large-ade20k"
model = smp.from_pretrained(checkpoint).eval().to(device)
preprocessing = A.Compose.from_pretrained(checkpoint)

# Load image
url = "https://huggingface.co/datasets/hf-internal-testing/fixtures_ade20k/resolve/main/ADE_val_00000001.jpg"
image = Image.open(requests.get(url, stream=True).raw)

# Preprocess image
np_image = np.array(image)
normalized_image = preprocessing(image=np_image)["image"]
input_tensor = torch.as_tensor(normalized_image)
input_tensor = input_tensor.permute(2, 0, 1).unsqueeze(0)  # HWC -> BCHW
input_tensor = input_tensor.to(device)

# Perform inference
with torch.no_grad():
    output_mask = model(input_tensor)

# Postprocess mask
mask = torch.nn.functional.interpolate(
    output_mask, size=(image.height, image.width), mode="bilinear", align_corners=False
)
mask = mask.argmax(1).cpu().numpy()  # argmax over predicted classes (channels dim)
```

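The `mask` array holds one ADE20K class index per pixel (shape `(1, H, W)`). As a quick way to inspect the result, you can save it as a grayscale image; a small follow-up sketch continuing from the snippet above:

```python
from PIL import Image

# `mask` has shape (1, H, W) with class indices 0..149; save the first (and only)
# item as an 8-bit grayscale PNG for a quick visual check.
Image.fromarray(mask[0].astype("uint8")).save("prediction.png")
```
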
## Model init parameters
```python
model_init_params = {
    "encoder_name": "tu-vit_large_patch16_384",
    "encoder_depth": 4,
    "encoder_weights": None,
    "encoder_output_indices": None,
    "decoder_intermediate_channels": (256, 512, 1024, 1024),
    "decoder_fusion_channels": 256,
    "dynamic_img_size": True,
    "in_channels": 3,
    "classes": 150,
    "activation": None,
    "aux_params": None
}
```

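These are the same values stored in `config.json`. If you want to rebuild the architecture yourself (with randomly initialized weights), a minimal sketch using `smp.create_model`, assuming your installed `segmentation_models_pytorch` version registers the `dpt` architecture:

```python
import segmentation_models_pytorch as smp

# Recreate the DPT architecture from the init parameters above.
# Weights are random here; use smp.from_pretrained("smp-hub/dpt-large-ade20k")
# to load the trained checkpoint instead.
model = smp.create_model(arch="dpt", **model_init_params)
```
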
## Dataset
Dataset name: [ADE20K](https://ade20k.csail.mit.edu/)

## More Information
- Library: https://github.com/qubvel/segmentation_models.pytorch
- Docs: https://smp.readthedocs.io/en/latest/

This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin).
albumentations_config_eval.json ADDED
@@ -0,0 +1 @@
{"__version__": "2.0.5", "transform": {"__class_fullname__": "Compose", "p": 1.0, "transforms": [{"__class_fullname__": "LongestMaxSize", "p": 1.0, "max_size": 480, "max_size_hw": null, "interpolation": 2, "mask_interpolation": 0}, {"__class_fullname__": "Normalize", "p": 1.0, "mean": [0.5, 0.5, 0.5], "std": [0.5, 0.5, 0.5], "max_pixel_value": 255.0, "normalization": "standard"}, {"__class_fullname__": "PadIfNeeded", "p": 1.0, "min_height": null, "min_width": null, "pad_height_divisor": 32, "pad_width_divisor": 32, "position": "center", "border_mode": 0, "fill": 0.0, "fill_mask": 0.0}], "bbox_params": null, "keypoint_params": null, "additional_targets": {}, "is_check_shapes": true}}
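For reference, this eval config corresponds roughly to the following Albumentations pipeline (a hand-reconstructed sketch; `A.Compose.from_pretrained(checkpoint)` shown in the README is the supported way to load it):

```python
import cv2
import albumentations as A

# Evaluation-time preprocessing reconstructed from albumentations_config_eval.json:
# resize the longest side to 480, normalize to roughly [-1, 1], then pad height and
# width up to multiples of 32.
preprocessing = A.Compose([
    A.LongestMaxSize(max_size=480, interpolation=cv2.INTER_CUBIC),
    A.Normalize(mean=(0.5, 0.5, 0.5), std=(0.5, 0.5, 0.5), max_pixel_value=255.0),
    A.PadIfNeeded(
        min_height=None,
        min_width=None,
        pad_height_divisor=32,
        pad_width_divisor=32,
        position="center",
        border_mode=cv2.BORDER_CONSTANT,
    ),
])
```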
config.json ADDED
@@ -0,0 +1,19 @@
{
    "_model_class": "DPT",
    "activation": null,
    "aux_params": null,
    "classes": 150,
    "decoder_fusion_channels": 256,
    "decoder_intermediate_channels": [
        256,
        512,
        1024,
        1024
    ],
    "dynamic_img_size": true,
    "encoder_depth": 4,
    "encoder_name": "tu-vit_large_patch16_384",
    "encoder_output_indices": null,
    "encoder_weights": null,
    "in_channels": 3
}
model.safetensors ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:b527beda408b0d4614f5fee260542e0ecc4db3cb33a0664891f5d5ffc51564a5
size 1377510920
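`model.safetensors` is stored via Git LFS (about 1.38 GB of weights). If you only need the raw weights file rather than the assembled model, it can be fetched directly with `huggingface_hub`; a sketch assuming the repo id from the README:

```python
from huggingface_hub import hf_hub_download
from safetensors.torch import load_file

# Download just the weights file from the Hub and inspect the stored tensors.
weights_path = hf_hub_download(repo_id="smp-hub/dpt-large-ade20k", filename="model.safetensors")
state_dict = load_file(weights_path)
print(f"{len(state_dict)} tensors, e.g. {next(iter(state_dict))}")
```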