Skip to content

Commit

Permalink
adjust to new readers for csv
Browse files Browse the repository at this point in the history
Signed-off-by: dafnapension <[email protected]>
  • Loading branch information
dafnapension committed Jan 23, 2025
1 parent df9c1e1 commit db4e827
Show file tree
Hide file tree
Showing 2 changed files with 9 additions and 5 deletions.
10 changes: 7 additions & 3 deletions src/unitxt/loaders.py
Original file line number Diff line number Diff line change
Expand Up @@ -447,9 +447,13 @@ def load_iterables(self):
         return iterables
 
     def split_generator(self, split: str) -> Generator:
-        dataset = pd.read_csv(
-            self.files[split], nrows=self.get_limit(), sep=self.sep
-        ).to_dict("records")
+        dataset = self.__class__._loader_cache.get(str(self) + "_" + split, None)
+        if dataset is None:
+            reader = self.get_reader()
+            dataset = reader(self.files[split], **self.get_args()).to_dict("records")
+            self.__class__._loader_cache.max_size = settings.loader_cache_size
+            self.__class__._loader_cache[str(self) + "_" + split] = dataset
+
         yield from dataset


Expand Down
4 changes: 2 additions & 2 deletions utils/.secrets.baseline
Original file line number Diff line number Diff line change
Expand Up @@ -151,7 +151,7 @@
 "filename": "src/unitxt/loaders.py",
 "hashed_secret": "840268f77a57d5553add023cfa8a4d1535f49742",
 "is_verified": false,
-"line_number": 595,
+"line_number": 599,
 "is_secret": false
 }
 ],
Expand Down Expand Up @@ -184,5 +184,5 @@
 }
 ]
 },
-"generated_at": "2025-01-23T12:43:28Z"
+"generated_at": "2025-01-23T13:22:15Z"
 }

0 comments on commit db4e827

Please sign in to comment.