Skip to content
Snippets Groups Projects

Save Dataset and DatasetElements in cache database

Merged Eva Bardou requested to merge save-dataset-db into main
All threads resolved!
1 file
+ 4
- 4
Compare changes
  • Side-by-side
  • Inline
@@ -336,7 +336,7 @@ class DatasetExtractor(DatasetWorker):
"""
logger.info(f"Inserting dataset ({dataset.id})")
with cache_database.atomic():
- return CachedDataset.create(
+ self.cached_dataset = CachedDataset.create(
id=dataset.id,
name=dataset.name,
state=dataset.state,
@@ -347,11 +347,11 @@ class DatasetExtractor(DatasetWorker):
# Configure temporary storage for the dataset data (cache + images)
self.configure_storage()
- splits = self.list_dataset_elements_per_split(dataset)
- self.cached_dataset = self.insert_dataset(dataset)
+ # Insert dataset in cache database
+ self.insert_dataset(dataset)
# Iterate over given splits
- for split_name, elements in splits:
+ for split_name, elements in self.list_dataset_elements_per_split(dataset):
casted_elements = list(map(_format_element, elements))
self.process_split(split_name, casted_elements)
Loading