File size: 585 Bytes
60fc5e8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
import os
import pymupdf4llm


class PdfConverter:
    """Convert a PDF to Markdown text via ``pymupdf4llm`` and optionally save it.

    Attributes:
        pdf_file: The PDF input handed unchanged to ``pymupdf4llm.to_markdown``
            (presumably a filesystem path -- confirm against callers).
        md_text: Result of the most recent conversion, or ``None`` if
            ``convert_to_markdown`` has not been called yet.
    """

    def __init__(self, pdf_file):
        """Remember the PDF input; no conversion happens until requested."""
        self.pdf_file = pdf_file
        self.md_text = None

    def convert_to_markdown(self) -> str:
        """Run the conversion, cache the result on ``self.md_text`` and return it."""
        self.md_text = pymupdf4llm.to_markdown(self.pdf_file)
        return self.md_text

    def save_markdown(self, output_file) -> None:
        """Write the converted Markdown to ``output_file`` as UTF-8.

        If no conversion has been run yet, it is performed first so that the
        output file is never created or truncated without content to write.

        Args:
            output_file: Destination path; an existing file is overwritten.
        """
        if self.md_text is None:
            # Convert before opening the file: a failed conversion must not
            # leave an empty or truncated output file behind.
            self.convert_to_markdown()
        # Explicit UTF-8: text extracted from PDFs frequently contains
        # non-ASCII characters that the platform default encoding may reject.
        with open(output_file, 'w', encoding='utf-8') as file:
            file.write(self.md_text)

# Example usage
# pdf_file = os.path.join(os.getcwd(), "pdfs", "test.pdf")
# converter = PdfConverter(pdf_file)
# text = converter.convert_to_markdown()
# print(text)