Farid Karimli
committed on
Commit
·
2ce64aa
1
Parent(s):
e27870a
LLamaparser prompt
Browse files
code/modules/data_loader.py
CHANGED
@@ -54,7 +54,7 @@ class LlamaParser:
|
|
54 |
language="en",
|
55 |
gpt4o_mode=True,
|
56 |
gpt4o_api_key=OPENAI_API_KEY,
|
57 |
-
parsing_instruction="The provided documents are PDFs of lecture slides of deep learning material. They contain LaTeX equations, images, and text. The goal is to extract the text and equations from the slides and convert them to markdown format. The markdown should be clean and easy to read, and any math equation should be converted to LaTeX, between $$."
|
58 |
)
|
59 |
|
60 |
def parse(self, pdf_path):
|
|
|
54 |
language="en",
|
55 |
gpt4o_mode=True,
|
56 |
gpt4o_api_key=OPENAI_API_KEY,
|
57 |
+
parsing_instruction="The provided documents are PDFs of lecture slides of deep learning material. They contain LaTeX equations, images, and text. The goal is to extract the text, images and equations from the slides and convert them to markdown format. The markdown should be clean and easy to read, and any math equation should be converted to LaTeX, between $$. For images, give a description and if you can, a source."
|
58 |
)
|
59 |
|
60 |
def parse(self, pdf_path):
|