[dc40d0]: / lavis / configs / models / clip_vit_large14.yaml

Download this file

53 lines (48 with data), 1.1 kB

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# Copyright (c) 2022, salesforce.com, inc.
# All rights reserved.
# SPDX-License-Identifier: BSD-3-Clause
# For full license text, see the LICENSE file in the repo root or https://opensource.org/licenses/BSD-3-Clause
model:
arch: clip
model_type: ViT-L-14
# ['RN50',
# 'RN50-quickgelu',
# 'RN50x4',
# 'RN50x16',
# 'RN101',
# 'RN101-quickgelu',
# 'timm-efficientnetv2_rw_s',
# 'timm-resnet50d',
# 'timm-resnetaa50d',
# 'timm-resnetblur50',
# 'timm-swin_base_patch4_window7_224',
# 'timm-vit_base_patch16_224',
# 'timm-vit_base_patch32_224',
# 'timm-vit_small_patch16_224',
# 'ViT-B-16',
# 'ViT-B-16-plus',
# 'ViT-B-16-plus-240',
# 'ViT-B-32',
# 'ViT-B-32-plus-256',
# 'ViT-B-32-quickgelu',
# 'ViT-g-14',
# 'ViT-H-14',
# 'ViT-H-16',
# 'ViT-L-14',
# 'ViT-L-14-280',
# 'ViT-L-14-336',
# 'ViT-L-16',
# 'ViT-L-16-320']
pretrained: openai
# "openai"
# following not available for all models
# "yfcc15m"
# "cc12m"
# "laion400m_e31"
# "laion400m_e32"
# "laion400m_avg"
preprocess:
vis_processor:
eval:
name: "clip_image_eval"
image_size: 224