File size: 5,927 Bytes
401fa20
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
import os as __os  # add "__" if not want to be exported
from copy import deepcopy as __deepcopy

#data_dir = f'{VL_DATA_DIR}'
data_dir = '/ssdstore/fmthoker/videos_images/'
if data_dir is None:
    raise ValueError("please set environment `VL_DATA_DIR` before continue")


#data_root = __os.path.join(data_dir, "videos_images")
#anno_root_pt = __os.path.join(data_dir, "anno_pretrain")
#anno_root_downstream = __os.path.join(data_dir, "anno_downstream")
data_root = data_dir
anno_root_pt = __os.path.join("/ssdstore/fmthoker/videos_images/", "anno_pretrain")
anno_root_downstream = __os.path.join("/ssdstore/fmthoker/videos_images/", "anno_downstream")

# ============== pretraining datasets=================
available_corpus = dict(
    # pretraining datasets
    cc3m=[
        f"{anno_root_pt}/cc3m_train.json", 
        "{your_data_root}"
    ],
    cc12m=[
        f"{anno_root_pt}/cc12m_train.json", 
        "{your_data_root}"
    ],
    sbu=[
        f"{anno_root_pt}/sbu.json", 
        "{your_data_root}"
    ],
    vg=[
        f"{anno_root_pt}/vg.json", 
        "{your_data_root}"
    ],
    coco=[
        f"{anno_root_pt}/coco.json", 
        "{your_data_root}"
    ],
    imagenet1k=[
        f"{anno_root_pt}/imagenet1k_train.json", 
        "{your_data_root}"
    ],
    webvid=[
        f"{anno_root_pt}/webvid_train.json", 
        "{your_data_root}",
        "video"
    ],
    webvid_10m=[
        f"{anno_root_pt}/webvid_10m_train.json",
        "{your_data_root}",
        "video",
    ],
    kinetics400=[
        f"{anno_root_pt}/kinetics400_train.json",
        "{your_data_root}",
        "video",
    ],
    kinetics710=[
        f"{anno_root_pt}/kinetics710_train.json",
        "{your_data_root}",
        "video",
    ],
    kinetics710_raw=[
        f"{anno_root_pt}/kinetics710_raw_train.json",
        "{your_data_root}",
        "only_video",
    ],
    internvid_10m_flt=[  
        #f"{anno_root_pt}/internvid_10m_flt.json",
        #f"/ibex/project/c2134/InternVid-10M-FLT/internvid_10m_flt.json",
        #"/ibex/project/c2134/InternVid-10M-FLT/vd-foundation___InternVid-10M-FLT/raw/InternVId-FLT_1/",
        f"/ibex/project/c2134/InternVid-10M-FLT/vd-foundation___InternVid-10M-FLT/annotations/internvid_10m_flt.json", 
        f"/ibex/project/c2134/InternVid-10M-FLT/vd-foundation___InternVid-10M-FLT/videos/",
         "video"
    ],
    internvid_300k_flt=[  
        f"/ibex/project/c2134/InternVid-10M-FLT/vd-foundation___InternVid-10M-FLT/annotations/internvid_300k_subset1.json", 
        f"/ibex/project/c2134/InternVid-10M-FLT/vd-foundation___InternVid-10M-FLT/videos/",
         "video"
    ],
    mad_300k=[  
        f"/ibex/project/c2134/Fida/MAD/annotations/v2/MAD_train_viclip.json", 
        f"/ibex/project/c2134/Fida/MAD/data/folder_pre_shards",
         "video"
    ],
    mad_100k=[  
        f"/ibex/project/c2134/Fida/MAD/annotations/v2/MAD_train_viclip_100k.json", 
        f"/ibex/project/c2134/Fida/MAD/data/folder_pre_shards",
         "video"
    ],
)

# composed datasets.
available_corpus["coco_vg"] = [available_corpus["coco"], available_corpus["vg"]]
available_corpus["in1k_k710"] = [
    available_corpus["imagenet1k"],
    available_corpus["kinetics710"],
]
available_corpus["webvid_cc3m"] = [available_corpus["webvid"], available_corpus["cc3m"]]
available_corpus["webvid_cc3m_in1k_k710"] = [
    available_corpus["webvid"], 
    available_corpus["cc3m"],
    available_corpus["imagenet1k"],
    available_corpus["kinetics710"],
]
available_corpus["webvid_cc3m_k710raw"] = [
    available_corpus["webvid"], 
    available_corpus["cc3m"],
    available_corpus["kinetics710_raw"],
]
available_corpus["webvid_14m"] = [
    available_corpus["webvid"],
    available_corpus["cc3m"],
    available_corpus["coco"],
    available_corpus["vg"],
    available_corpus["sbu"],
    available_corpus["cc12m"],
]
available_corpus["webvid12m_14m"] = [
    available_corpus["webvid"],
    available_corpus["webvid_10m"],
    available_corpus["cc3m"],
    available_corpus["coco"],
    available_corpus["vg"],
    available_corpus["sbu"],
    available_corpus["cc12m"],
]
available_corpus["webvid10m_14m"] = [
    available_corpus["webvid_10m"],
    available_corpus["cc3m"],
    available_corpus["coco"],
    available_corpus["vg"],
    available_corpus["sbu"],
    available_corpus["cc12m"],
]
available_corpus["simple_17m"] = [
    available_corpus["webvid"],
    available_corpus["cc3m"],
    available_corpus["cc12m"],
]
available_corpus["simple_25m"] = [
    available_corpus["webvid_10m"],
    available_corpus["cc3m"],
    available_corpus["cc12m"],
]
available_corpus["viclip_20m"] = [
    available_corpus["internvid_10m_flt"],
    available_corpus["webvid_10m"],
]
available_corpus["viclip"] = [
    available_corpus["internvid_10m_flt"],
]
available_corpus["viclip_mad_300k"] = [
    available_corpus["mad_300k"],
]
available_corpus["viclip_mad_100k"] = [
    available_corpus["mad_100k"],
]
available_corpus["viclip_internvid_300k"] = [
    available_corpus["internvid_300k_flt"],
]

# ============== for validation =================
available_corpus["msrvtt_1k_test"] = [
    f"{anno_root_downstream}/msrvtt_test1k.json",
    f"{data_root}/msrvtt_2fps_224",
    "video",
]
available_corpus["k400_act_val"] = [
    f"{anno_root_downstream}/kinetics400_validate.json",
    "{your_data_root}",
    "video",
]
available_corpus["k600_act_val"] = [
    f"{anno_root_downstream}/kinetics600_validate.json",
    "{your_data_root}",
    "video",
]
available_corpus["k700_act_val"] = [
    f"{anno_root_downstream}/kinetics700_validate.json",
    "{your_data_root}",
    "video",
]
available_corpus["sthsthv1_act_val"] = [
    f"{anno_root_downstream}/sthsthv1_validate_clean2.json",
    "{your_data_root}",
    "video",
]
available_corpus["sthsthv2_act_val"] = [
    f"{anno_root_downstream}/sthsthv2_validate_clean2.json",
    "{your_data_root}",
    "video",
]