-
Notifications
You must be signed in to change notification settings - Fork 152
/
Copy pathwrap_few_shot_dataset.py
69 lines (60 loc) · 2.5 KB
/
wrap_few_shot_dataset.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
from typing import List, Tuple
from torch import Tensor
from torch.utils.data import Dataset
from tqdm import tqdm
from .few_shot_dataset import FewShotDataset
class WrapFewShotDataset(FewShotDataset):
"""
Wrap a dataset in a FewShotDataset. This is useful if you have your own dataset
and want to use it with the tools provided by EasyFSL such as TaskSampler.
"""
def __init__(
self,
dataset: Dataset,
image_position_in_get_item_output: int = 0,
label_position_in_get_item_output: int = 1,
):
"""
Wrap a dataset in a FewShotDataset.
Args:
dataset: dataset to wrap
image_position_in_get_item_output: position of the image in the tuple returned
by dataset.__getitem__(). Default: 0
label_position_in_get_item_output: position of the label in the tuple returned
by dataset.__getitem__(). Default: 1
"""
if image_position_in_get_item_output == label_position_in_get_item_output:
raise ValueError(
"image_position_in_get_item_output and label_position_in_get_item_output must be different."
)
if (
image_position_in_get_item_output < 0
or label_position_in_get_item_output < 0
):
raise ValueError(
"image_position_in_get_item_output and label_position_in_get_item_output must be positive."
)
item_length = len(dataset[0])
if (
image_position_in_get_item_output >= item_length
or label_position_in_get_item_output >= item_length
):
raise ValueError("Specified positions in output are out of range.")
self.source_dataset = dataset
self.labels = [
source_dataset_instance[label_position_in_get_item_output]
for source_dataset_instance in tqdm(
dataset, desc="Scrolling dataset's labels..."
)
]
self.image_position_in_get_item_output = image_position_in_get_item_output
self.label_position_in_get_item_output = label_position_in_get_item_output
def __getitem__(self, item: int) -> Tuple[Tensor, int]:
return (
self.source_dataset[item][self.image_position_in_get_item_output],
self.source_dataset[item][self.label_position_in_get_item_output],
)
def __len__(self) -> int:
return len(self.labels)
def get_labels(self) -> List[int]:
return self.labels