Instructions to use RGBD-SOD/custom-resnet50d with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Transformers
How to use RGBD-SOD/custom-resnet50d with Transformers:
# Use a pipeline as a high-level helper from transformers import pipeline pipe = pipeline("feature-extraction", model="RGBD-SOD/custom-resnet50d", trust_remote_code=True)# Load model directly from transformers import AutoModel model = AutoModel.from_pretrained("RGBD-SOD/custom-resnet50d", trust_remote_code=True, dtype="auto") - Notebooks
- Google Colab
- Kaggle
| from typing import Dict | |
| import timm | |
| from timm.models.resnet import BasicBlock, Bottleneck, ResNet | |
| from torch import Tensor, nn | |
| from transformers import PreTrainedModel | |
| from .configuration_resnet import ResnetConfig | |
| BLOCK_MAPPING = {"basic": BasicBlock, "bottleneck": Bottleneck} | |
| class ResnetModel(PreTrainedModel): | |
| """ | |
| The line that sets the config_class is not mandatory, | |
| unless you want to register your model with the auto classes | |
| """ | |
| config_class = ResnetConfig | |
| def __init__(self, config: ResnetConfig): | |
| super().__init__(config) | |
| block_layer = BLOCK_MAPPING[config.block_type] | |
| self.model = ResNet( | |
| block_layer, | |
| config.layers, | |
| num_classes=config.num_classes, | |
| in_chans=config.input_channels, | |
| cardinality=config.cardinality, | |
| base_width=config.base_width, | |
| stem_width=config.stem_width, | |
| stem_type=config.stem_type, | |
| avg_down=config.avg_down, | |
| ) | |
| def forward(self, tensor: Tensor) -> Tensor: | |
| return self.model.forward_features(tensor) | |
| class ResnetModelForImageClassification(PreTrainedModel): | |
| """ | |
| The line that sets the config_class is not mandatory, | |
| unless you want to register your model with the auto classes | |
| """ | |
| config_class = ResnetConfig | |
| def __init__(self, config: ResnetConfig): | |
| super().__init__(config) | |
| self.model = ResnetModel(config) | |
| """ | |
| You can have your model return anything you want, | |
| but returning a dictionary like we did for ResnetModelForImageClassification, | |
| with the loss included when labels are passed, | |
| will make your model directly usable inside the Trainer class. | |
| Using another output format is fine as long as you are planning on | |
| using your own training loop or another library for training. | |
| """ | |
| def forward(self, tensor: Tensor, labels=None) -> Dict[str, Tensor]: | |
| logits = self.model(tensor) | |
| if labels is not None: | |
| loss = nn.cross_entropy(logits, labels) | |
| return {"loss": loss, "logits": logits} | |
| return {"logits": logits} | |
| if __name__ == "__main__": | |
| resnet50d_config = ResnetConfig.from_pretrained("custom-resnet") | |
| resnet50d = ResnetModelForImageClassification(resnet50d_config) | |
| # Load pretrained weights from timm | |
| pretrained_model: nn.Module = timm.create_model("resnet50d", pretrained=True) | |
| resnet50d.model.load_state_dict(pretrained_model.state_dict()) | |