Reading multiple directories in transcript browser
This commit is contained in:
16
src/pdf_browser/read_pdf.py
Normal file
16
src/pdf_browser/read_pdf.py
Normal file
@@ -0,0 +1,16 @@
|
||||
import pypdf
|
||||
|
||||
# Dump the text of every page of the PDF into a single UTF-8 text file.
# Each page's text is preceded by a marker line carrying its 1-based number.
reader = pypdf.PdfReader("C:/Users/Karol/Desktop/Hegels-Logic.pdf")

# The context manager closes the output file even if text extraction or a
# write fails part-way through the document.
with open("asd.txt", "w", encoding="utf-8") as f:
    for page_number, page in enumerate(reader.pages, start=1):
        text = page.extract_text()
        # Collapse the page onto one line, then strip hyphens.
        # NOTE(review): this removes every "-", not only hyphens that were
        # introduced by line breaks -- confirm that is intended.
        text = text.replace("\n", "")
        text = text.replace("-", "")

        f.write(f">>>>>>>>{page_number}<<<<<<<<<\n")
        f.write(text)
        f.write("\n")
|
||||
Reference in New Issue
Block a user