# Extract the text of a PDF with Apache Tika, echo it to stdout, and save it
# to a UTF-8 encoded text file.
from tika import parser

raw = parser.from_file('muenzkomplex_Split.pdf')

# Tika can report ``content`` as None when it finds no extractable text
# (e.g. an image-only PDF). Fall back to an empty string so the output steps
# below receive a str instead of failing on a non-iterable value.
content = raw['content'] or ""
print(content)

with open("text_Output.txt", "w", encoding="utf-8") as out:
    # write() emits the whole string in one call; writelines() would iterate
    # the string character by character.
    out.write(content)