[8956d4]: / unimol / data / key_dataset.py

Download this file

29 lines (21 with data), 751 Bytes

 1
 2
 3
 4
 5
 6
 7
 8
 9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
# Copyright (c) DP Technology.
# This source code is licensed under the MIT license found in the
# LICENSE file in the root directory of this source tree.
from functools import lru_cache
from unicore.data import BaseWrapperDataset
class KeyDataset(BaseWrapperDataset):
def __init__(self, dataset, key):
self.dataset = dataset
self.key = key
def __len__(self):
return len(self.dataset)
@lru_cache(maxsize=16)
def __getitem__(self, idx):
return self.dataset[idx][self.key]
class LengthDataset(BaseWrapperDataset):
def __init__(self, dataset):
super().__init__(dataset)
@lru_cache(maxsize=16)
def __getitem__(self, idx):
item = self.dataset[idx]
return len(item)