@@ -468,7 +468,8 @@ def mvitv2_t(*, weights: Optional[MViTV2_T_Weights] = None, progress: bool = Tru
468
468
"""
469
469
Constructs a tiny MViTv2 architecture from
470
470
`MViTv2: Improved Multiscale Vision Transformers for Classification and Detection
471
- <https://arxiv.org/abs/2112.01526>`__.
471
+ <https://arxiv.org/abs/2112.01526>`__ and `Multiscale Vision Transformers
472
+ <https://arxiv.org/abs/2104.11227>`__.
472
473
473
474
Args:
474
475
weights (:class:`~torchvision.models.video.MViTV2_T_Weights`, optional): The
@@ -503,9 +504,10 @@ def mvitv2_t(*, weights: Optional[MViTV2_T_Weights] = None, progress: bool = Tru
503
504
504
505
def mvitv2_s(*, weights: Optional[MViTV2_S_Weights] = None, progress: bool = True, **kwargs: Any) -> MViTv2:
505
506
"""
506
- Constructs a tiny MViTv2 architecture from
507
+ Constructs a small MViTv2 architecture from
507
508
`MViTv2: Improved Multiscale Vision Transformers for Classification and Detection
508
- <https://arxiv.org/abs/2112.01526>`__.
509
+ <https://arxiv.org/abs/2112.01526>`__ and `Multiscale Vision Transformers
510
+ <https://arxiv.org/abs/2104.11227>`__.
509
511
510
512
Args:
511
513
weights (:class:`~torchvision.models.video.MViTV2_S_Weights`, optional): The
@@ -540,9 +542,10 @@ def mvitv2_s(*, weights: Optional[MViTV2_S_Weights] = None, progress: bool = Tru
540
542
541
543
def mvitv2_b(*, weights: Optional[MViTV2_B_Weights] = None, progress: bool = True, **kwargs: Any) -> MViTv2:
542
544
"""
543
- Constructs a tiny MViTv2 architecture from
545
+ Constructs a base MViTv2 architecture from
544
546
`MViTv2: Improved Multiscale Vision Transformers for Classification and Detection
545
- <https://arxiv.org/abs/2112.01526>`__.
547
+ <https://arxiv.org/abs/2112.01526>`__ and `Multiscale Vision Transformers
548
+ <https://arxiv.org/abs/2104.11227>`__.
546
549
547
550
Args:
548
551
weights (:class:`~torchvision.models.video.MViTV2_B_Weights`, optional): The
0 commit comments