Loading zoo/ccip/backbone.py +2 −1 Original line number Diff line number Diff line Loading @@ -5,7 +5,7 @@ import clip import torch from torchvision.transforms import Compose from .caformer import get_caformer from .caformer import get_caformer, get_caformer_s18 def get_clip_backbone(name="ViT-B/32") -> Tuple[torch.nn.Module, Compose]: Loading @@ -22,6 +22,7 @@ def register_backbone(name, func, *args, **kwargs): register_backbone('caformer', get_caformer) register_backbone('caformer_s18', get_caformer_s18) def get_backbone(name: str) -> Tuple[torch.nn.Module, Compose]: Loading zoo/ccip/caformer.py +7 −0 Original line number Diff line number Diff line Loading @@ -32,3 +32,10 @@ def get_caformer(input_resolution: int = 384, heads: int = 8, feat_dims: int = 7 ] return CaformerBackbone(input_resolution, heads, feat_dims, **kwargs), transform def get_caformer_s18(input_resolution: int = 384, heads: int = 8, feat_dims: int = 768, **kwargs): transform = [ Normalize((0.48145466, 0.4578275, 0.40821073), (0.26862954, 0.26130258, 0.27577711)), ] return CaformerBackbone(input_resolution, heads, feat_dims, arch='caformer_s18_384_in21ft1k', **kwargs), transform No newline at end of file Loading
zoo/ccip/backbone.py +2 −1 Original line number Diff line number Diff line Loading @@ -5,7 +5,7 @@ import clip import torch from torchvision.transforms import Compose from .caformer import get_caformer from .caformer import get_caformer, get_caformer_s18 def get_clip_backbone(name="ViT-B/32") -> Tuple[torch.nn.Module, Compose]: Loading @@ -22,6 +22,7 @@ def register_backbone(name, func, *args, **kwargs): register_backbone('caformer', get_caformer) register_backbone('caformer_s18', get_caformer_s18) def get_backbone(name: str) -> Tuple[torch.nn.Module, Compose]: Loading
zoo/ccip/caformer.py +7 −0 Original line number Diff line number Diff line Loading @@ -32,3 +32,10 @@ def get_caformer(input_resolution: int = 384, heads: int = 8, feat_dims: int = 7 ] return CaformerBackbone(input_resolution, heads, feat_dims, **kwargs), transform def get_caformer_s18(input_resolution: int = 384, heads: int = 8, feat_dims: int = 768, **kwargs): transform = [ Normalize((0.48145466, 0.4578275, 0.40821073), (0.26862954, 0.26130258, 0.27577711)), ] return CaformerBackbone(input_resolution, heads, feat_dims, arch='caformer_s18_384_in21ft1k', **kwargs), transform No newline at end of file