@@ -699,6 +699,12 @@ def resnet34(*, weights: Optional[ResNet34_Weights] = None, progress: bool = Tru
699699def resnet50 (* , weights : Optional [ResNet50_Weights ] = None , progress : bool = True , ** kwargs : Any ) -> ResNet :
700700 """ResNet-50 from `Deep Residual Learning for Image Recognition <https://arxiv.org/pdf/1512.03385.pdf>`__.
701701
702+ .. note::
703+ The bottleneck of TorchVision places the stride for downsampling to the second 3x3
704+ convolution while the original paper places it to the first 1x1 convolution.
705+ This variant improves the accuracy and is known as `ResNet V1.5
706+ <https://ngc.nvidia.com/catalog/model-scripts/nvidia:resnet_50_v1_5_for_pytorch>`_.
707+
702708 Args:
703709 weights (:class:`~torchvision.models.ResNet50_Weights`, optional): The
704710 pretrained weights to use. See
@@ -724,6 +730,12 @@ def resnet50(*, weights: Optional[ResNet50_Weights] = None, progress: bool = Tru
724730def resnet101 (* , weights : Optional [ResNet101_Weights ] = None , progress : bool = True , ** kwargs : Any ) -> ResNet :
725731 """ResNet-101 from `Deep Residual Learning for Image Recognition <https://arxiv.org/pdf/1512.03385.pdf>`__.
726732
733+ .. note::
734+ The bottleneck of TorchVision places the stride for downsampling to the second 3x3
735+ convolution while the original paper places it to the first 1x1 convolution.
736+ This variant improves the accuracy and is known as `ResNet V1.5
737+ <https://ngc.nvidia.com/catalog/model-scripts/nvidia:resnet_50_v1_5_for_pytorch>`_.
738+
727739 Args:
728740 weights (:class:`~torchvision.models.ResNet101_Weights`, optional): The
729741 pretrained weights to use. See
@@ -749,6 +761,12 @@ def resnet101(*, weights: Optional[ResNet101_Weights] = None, progress: bool = T
749761def resnet152 (* , weights : Optional [ResNet152_Weights ] = None , progress : bool = True , ** kwargs : Any ) -> ResNet :
750762 """ResNet-152 from `Deep Residual Learning for Image Recognition <https://arxiv.org/pdf/1512.03385.pdf>`__.
751763
764+ .. note::
765+ The bottleneck of TorchVision places the stride for downsampling to the second 3x3
766+ convolution while the original paper places it to the first 1x1 convolution.
767+ This variant improves the accuracy and is known as `ResNet V1.5
768+ <https://ngc.nvidia.com/catalog/model-scripts/nvidia:resnet_50_v1_5_for_pytorch>`_.
769+
752770 Args:
753771 weights (:class:`~torchvision.models.ResNet152_Weights`, optional): The
754772 pretrained weights to use. See
0 commit comments