Farid Karimli
committed on
Commit
·
351c4c7
1
Parent(s):
229ace9
Buffered images for GPT4o mini
Browse files
code/modules/dataloader/pdf_readers/gpt.py
CHANGED
@@ -65,6 +65,7 @@ class GPTParser:
|
|
65 |
output += chunk_output + "\n---\n"
|
66 |
|
67 |
output = output.split("\n---\n")
|
|
|
68 |
|
69 |
documents = [
|
70 |
Document(
|
|
|
65 |
output += chunk_output + "\n---\n"
|
66 |
|
67 |
output = output.split("\n---\n")
|
68 |
+
output = [doc for doc in output if doc.strip() != ""]
|
69 |
|
70 |
documents = [
|
71 |
Document(
|