diff --git a/slide_indexer/basic_indexer.py b/slide_indexer/basic_indexer.py index bf9a2b9384f3907737806e232e7e13fa38445e49..e10a942733988539b05187d8c0f1cd5f084be4e7 100644 --- a/slide_indexer/basic_indexer.py +++ b/slide_indexer/basic_indexer.py @@ -20,8 +20,8 @@ class BasicIndexer(): pdf_file_name = pdf_file_path.split(os.sep)[-1] for i, page in enumerate(pdf.pages): text = page.extract_text() - self.index.add(pdf_file_name, i, text, text.split("\n")[self.title_row]) + self.index.add(pdf_file_name, i + 1, text, text.split("\n")[self.title_row]) if self.process_images: - img_name = pdf_file_name + "_" + str(i) + ".jpg" + img_name = pdf_file_name + "_" + str(i + 1) + ".jpg" img_path = os.path.join(self.image_dir, img_name) page.to_image().save(img_path)