-
Notifications
You must be signed in to change notification settings - Fork 47
/
Copy pathfastaidatasets.jl
126 lines (111 loc) · 5.4 KB
/
fastaidatasets.jl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
"""
    FastAIDataset

Metadata describing one downloadable archive of the fastai dataset repository.

# Fields
- `name::String`: base name of the archive; it is the file name (without extension)
  in the download URL.
- `subfolder::String`: suffix appended to `ROOT_URL` to form the folder part of the
  download URL, e.g. `"imageclas"`.
- `extension::String`: archive file extension, e.g. `"tgz"` or `"zip"`.
- `description::String`: free-form text included in the data dependency's message.
- `checksum`: checksum passed unchanged to `DataDep`. Deliberately left untyped so
  that any checksum form `DataDep` accepts can be stored, not only strings.
- `datadepname::String`: name the data dependency is registered under (a `fastai-`
  prefix is added at registration time).
- `size::String`: human-readable download size shown in the data dependency's message.

The string fields are concretely typed; `AbstractString` arguments are converted to
`String` by the default constructor.
"""
struct FastAIDataset
    name::String
    subfolder::String
    extension::String
    description::String
    checksum
    datadepname::String
    size::String
end
# Common URL prefix of all fastai dataset downloads. A dataset's `subfolder` is appended
# directly to it (no separator), so "imageclas" yields ".../fast-ai-imageclas/...".
const ROOT_URL = "https://s3.amazonaws.com/fast-ai-"
"""
    FastAIDataset(name, subfolder, checksum = ""; kwargs...)

Convenience constructor that fills in defaults for the less frequently set fields.

# Arguments
- `name`: base name of the archive.
- `subfolder`: folder suffix the archive lives under.
- `checksum`: checksum stored on the dataset; defaults to `""`.

# Keywords
- `extension = "tgz"`: archive file extension.
- `description = ""`: free-form description text.
- `datadepname = name`: registration name; defaults to `name`.
- `size = "???"`: human-readable download size.
"""
function FastAIDataset(
    name,
    subfolder,
    checksum = "";
    extension = "tgz",
    description = "",
    datadepname = name,
    size = "???",
)
    # Field order of the struct differs from the argument order of this method.
    fields = (name, subfolder, extension, description, checksum, datadepname, size)
    return FastAIDataset(fields...)
end
# Table of all datasets that can be downloaded from the fastai dataset repository.
#
# Every entry is built with the convenience constructor
# `FastAIDataset(name, subfolder, checksum = ""; extension, description, datadepname, size)`,
# so an entry without a third positional argument carries the default checksum `""`.
# NOTE(review): the checksum literals are 64 hex characters, presumably SHA-256
# digests — confirm against the hasher DataDeps applies to string checksums.
#
# Entries are grouped by their `subfolder`; the group name is given in the comment
# that precedes each group.
const DATASETCONFIGS = [
# imageclas
FastAIDataset("CUB_200_2011", "imageclas"),
FastAIDataset("bedroom", "imageclas"),
FastAIDataset("caltech_101", "imageclas"),
FastAIDataset("cifar10", "imageclas", "637c5814e11aefcb6ee76d5f59c67ddc8de7f5b5077502a195b0833d1e3e4441"),
FastAIDataset("cifar100", "imageclas", "085ac613ceb0b3659c8072143ae553d5dd146b3c4206c3672a56ed02d0e77d28"),
FastAIDataset("food-101", "imageclas"),
FastAIDataset("imagenette-160", "imageclas"),
FastAIDataset("imagenette-320", "imageclas"),
FastAIDataset("imagenette", "imageclas"),
FastAIDataset("imagenette2-160", "imageclas", "88daccb09b6fce93f45e6c09ddeb269cce705549e6bff322092a2a5a11489863"),
FastAIDataset("imagenette2-320", "imageclas", "569b4497c98db6dd29f335d1f109cf315fe127053cedf69010d047f0188e158c"),
FastAIDataset("imagenette2", "imageclas"),
FastAIDataset("imagewang-160", "imageclas"),
FastAIDataset("imagewang-320", "imageclas"),
FastAIDataset("imagewang", "imageclas"),
FastAIDataset("imagewoof-160", "imageclas"),
FastAIDataset("imagewoof-320", "imageclas"),
FastAIDataset("imagewoof", "imageclas"),
FastAIDataset("imagewoof2-160", "imageclas", "663c22f69c2802d85e2a67103c017e047096702ffddf9149a14011b7002539bf"),
FastAIDataset("imagewoof2-320", "imageclas"),
FastAIDataset("imagewoof2", "imageclas"),
FastAIDataset("mnist_png", "imageclas", "9e18edaa3a08b065d8f80a019ca04329e6d9b3e391363414a9bd1ada30563672"),
FastAIDataset("mnist_var_size_tiny", "imageclas", "8a0f6ca04c2d31810dc08e739c7fa9b612e236383f70dd9fc6e5a62e672e2283"),
FastAIDataset("oxford-102-flowers", "imageclas"),
FastAIDataset("oxford-iiit-pet", "imageclas"),
FastAIDataset("stanford-cars", "imageclas"),
# nlp
FastAIDataset("ag_news_csv", "nlp"),
FastAIDataset("amazon_review_full_csv", "nlp"),
FastAIDataset("amazon_review_polarity_csv", "nlp"),
FastAIDataset("dbpedia_csv", "nlp"),
FastAIDataset("giga-fren", "nlp"),
FastAIDataset("imdb", "nlp"),
FastAIDataset("sogou_news_csv", "nlp"),
FastAIDataset("wikitext-103", "nlp"),
FastAIDataset("wikitext-2", "nlp"),
FastAIDataset("yahoo_answers_csv", "nlp"),
FastAIDataset("yelp_review_full_csv", "nlp"),
FastAIDataset("yelp_review_polarity_csv", "nlp"),
# imagelocal
FastAIDataset("biwi_head_pose", "imagelocal"),
FastAIDataset("camvid", "imagelocal"),
FastAIDataset("pascal-voc", "imagelocal"),
FastAIDataset("pascal_2007", "imagelocal"),
FastAIDataset("pascal_2012", "imagelocal"),
FastAIDataset("siim_small", "imagelocal"),
FastAIDataset("skin-lesion", "imagelocal"),
FastAIDataset("tcga-small", "imagelocal"),
# sample
FastAIDataset("adult_sample", "sample"),
FastAIDataset("biwi_sample", "sample"),
FastAIDataset("camvid_tiny", "sample", "cd42a9bdd8ad3e0ce87179749beae05b4beb1ae6ab665841180b1d8022fc230b"),
FastAIDataset("dogscats", "sample"),
FastAIDataset("human_numbers", "sample"),
FastAIDataset("imdb_sample", "sample"),
FastAIDataset("mnist_sample", "sample"),
FastAIDataset("mnist_tiny", "sample"),
FastAIDataset("movie_lens_sample", "sample"),
FastAIDataset("planet_sample", "sample"),
FastAIDataset("planet_tiny", "sample"),
# coco
# Only `coco_sample` uses the default `tgz` extension and its own name as
# `datadepname`; the remaining entries are `zip` archives whose `datadepname` is
# the archive name prefixed with `coco-`.
FastAIDataset("coco_sample", "coco", "56960c0ac09ff35cd8588823d37e1ed0954cb88b8bfbd214a7763e72f982911c", size = "3GB"),
FastAIDataset("train2017", "coco", datadepname="coco-train2017", extension="zip"),
FastAIDataset("val2017", "coco", datadepname="coco-val2017", extension="zip"),
FastAIDataset("test2017", "coco", datadepname="coco-test2017", extension="zip"),
FastAIDataset("unlabeled2017", "coco", datadepname="coco-unlabeled2017", extension="zip"),
FastAIDataset("image_info_test2017", "coco", datadepname="coco-image_info_test2017", extension="zip"),
FastAIDataset("image_info_unlabeled2017", "coco", datadepname="coco-image_info_unlabeled2017", extension="zip"),
FastAIDataset("annotations_trainval2017", "coco", datadepname="coco-annotations_trainval2017", extension="zip"),
FastAIDataset("stuff_annotations_trainval2017", "coco", datadepname="coco-stuff_annotations_trainval2017", extension="zip"),
FastAIDataset("panoptic_annotations_trainval2017", "coco", datadepname="coco-panoptic_annotations_trainval2017", extension="zip"),
]
# Registration names (`datadepname`) of all configured datasets, in table order.
const DATASETS = map(config -> config.datadepname, DATASETCONFIGS)
# Registration names of the datasets usable for image classification: every dataset
# in the `imageclas` subfolder, followed by three datasets listed explicitly by name.
const DATASETS_IMAGECLASSIFICATION = let
    imageclas = filter(config -> config.subfolder == "imageclas", DATASETCONFIGS)
    extras = ["mnist_sample", "mnist_tiny", "dogscats"]
    vcat(map(config -> config.datadepname, imageclas), extras)
end
"""
    DataDeps.DataDep(d::FastAIDataset)

Build the `DataDep` describing the download of dataset `d`.

The data dependency is named `fastai-<datadepname>`. Its remote path is composed of
`ROOT_URL`, the dataset's `subfolder`, `name` and `extension`. `d.checksum` is passed
on as the checksum argument and `DataDeps.unpack` is used as the post-fetch method.
"""
function DataDeps.DataDep(d::FastAIDataset)
    depname = "fastai-$(d.datadepname)"
    # The common indentation of a triple-quoted string is stripped, so the message
    # starts at column zero and ends with a newline.
    message = """
        "$(d.name)" from the fastai dataset repository (https://course.fast.ai/datasets)
        $(d.description)
        Download size: $(d.size)
        """
    remote = "$(ROOT_URL)$(d.subfolder)/$(d.name).$(d.extension)"
    return DataDep(
        depname, message, remote, d.checksum; post_fetch_method = DataDeps.unpack
    )
end
"""
    initdatadeps()

Register one `DataDep` with DataDeps for every entry of `DATASETCONFIGS`.

Returns `nothing`.
"""
function initdatadeps()
    foreach(DATASETCONFIGS) do config
        DataDeps.register(DataDep(config))
    end
    return nothing
end