Commit 4576b4ca authored by Nicolas Atrax

Update PDFtoTXT.py

parent ccaa047c
......@@ -4,6 +4,7 @@ from lib.tika.tika import parser
from datetime import date
from lib.pdfminer.pdfminer.pdfparser import PDFParser
from lib.pdfminer.pdfminer.pdfdocument import PDFDocument
# Set the TIKA_SERVER_JAR environment variable for this process to the
# tika-server 1.19 JAR hosted on Maven Central.
# NOTE(review): this assignment runs after `from lib.tika.tika import parser`
# earlier in the file. Presumably the vendored tika client reads
# TIKA_SERVER_JAR when it is imported (upstream tika-python does) -- confirm
# the value is still picked up here, or move this assignment above that import.
os.environ['TIKA_SERVER_JAR'] = 'https://repo1.maven.org/maven2/org/apache/tika/tika-server/1.19/tika-server-1.19.jar'
def replaceNewlines(txt):
tmp = txt.split("\n")
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment