Farid Karimli committed on
Commit
351c4c7
1 Parent(s): 229ace9

Buffered images for GPT4o mini

Browse files
code/modules/dataloader/pdf_readers/gpt.py CHANGED
@@ -65,6 +65,7 @@ class GPTParser:
65
  output += chunk_output + "\n---\n"
66
 
67
  output = output.split("\n---\n")
 
68
 
69
  documents = [
70
  Document(
 
65
  output += chunk_output + "\n---\n"
66
 
67
  output = output.split("\n---\n")
68
+ output = [doc for doc in output if doc.strip() != ""]
69
 
70
  documents = [
71
  Document(