diff --git a/app.py b/app.py index fc4ec45be2250f12b1ec597e572037781ca038dc..7ca97a82c830f5e279cc0c1b5c2d99ef00204230 100644 --- a/app.py +++ b/app.py @@ -35,26 +35,28 @@ def upload(): filename = secure_filename(file.filename) file_path = os.path.join(Path(SLIDE_DIR), filename) file.save(file_path) - pdf = pdfplumber.load(file) + pdf = pdfplumber.open(file_path) index = SearchIndex() for i, page in enumerate(pdf.pages): text = page.extract_text() index.add(str(file_path), i, text) + img_name = str(file_path)[7:] + "_" + str(i) + ".jpg" + img_path = os.path.join(IMAGE_DIR, img_name) + page.to_image().save(img_path) del index return redirect('/') - @app.route("/query") def query(): try: index = SearchIndex() query = request.args.get("query") result = index.search(query) - pdf = pdfplumber.open(result["path"]) - page = pdf.pages[result["page"]] + #pdf = pdfplumber.open(result["path"]) + #page = pdf.pages[result["page"]] img_name = result["path"][7:] + "_" + str(result["page"]) + ".jpg" - img_path = os.path.join(IMAGE_DIR, img_name) - page.to_image().save(img_path) + #img_path = os.path.join(IMAGE_DIR, img_name) + #page.to_image().save(img_path) return "slide/" + img_name except: return str(sys.exc_info()[0]).replace("<", "-").replace(">", "-")