From 93a231a477f3a7f74aa661ebe7c817060dd11ceb Mon Sep 17 00:00:00 2001 From: mkozlowskiAzimuthe Date: Wed, 25 Jan 2023 18:06:04 +0100 Subject: [PATCH] print --- utils/donut_dataset_stream.py | 1 + 1 file changed, 1 insertion(+) diff --git a/utils/donut_dataset_stream.py b/utils/donut_dataset_stream.py index f295c8d..e10a0fa 100644 --- a/utils/donut_dataset_stream.py +++ b/utils/donut_dataset_stream.py @@ -48,6 +48,7 @@ class DonutDataset(Dataset): self.added_tokens = added_tokens self.dataset = load_dataset(dataset_name_or_path, split=self.split, streaming=True).with_format("torch") + print(self.dataset) self.dataset_length = len(self.dataset) self.gt_token_sequences = []