correct logs formating for dataviewer
Browse files- climateqa/constants.py +1 -1
- climateqa/logging.py +16 -10
climateqa/constants.py
CHANGED
|
@@ -97,7 +97,7 @@ DOCUMENT_METADATA_DEFAULT_VALUES = {
|
|
| 97 |
"content": "",
|
| 98 |
"reranking_score": 0.0,
|
| 99 |
"query_used_for_retrieval": "",
|
| 100 |
-
"sources_used": [],
|
| 101 |
"question_used": "",
|
| 102 |
"index_used": ""
|
| 103 |
}
|
|
|
|
| 97 |
"content": "",
|
| 98 |
"reranking_score": 0.0,
|
| 99 |
"query_used_for_retrieval": "",
|
| 100 |
+
"sources_used": [""],
|
| 101 |
"question_used": "",
|
| 102 |
"index_used": ""
|
| 103 |
}
|
climateqa/logging.py
CHANGED
|
@@ -7,7 +7,7 @@ import csv
|
|
| 7 |
import pandas as pd
|
| 8 |
import io
|
| 9 |
from typing import TypedDict, List
|
| 10 |
-
from constants import DOCUMENT_METADATA_DEFAULT_VALUES
|
| 11 |
|
| 12 |
|
| 13 |
def serialize_docs(docs:list)->list:
|
|
@@ -25,18 +25,24 @@ def serialize_docs(docs:list)->list:
|
|
| 25 |
"""
|
| 26 |
new_docs = []
|
| 27 |
for doc in docs:
|
| 28 |
-
|
| 29 |
-
new_doc
|
| 30 |
-
|
|
|
|
|
|
|
| 31 |
|
| 32 |
-
#
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
# Copy each metadata field, using default if missing
|
| 36 |
for field, default_value in DOCUMENT_METADATA_DEFAULT_VALUES.items():
|
| 37 |
-
|
| 38 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
new_docs.append(new_doc)
|
|
|
|
|
|
|
|
|
|
| 40 |
return new_docs
|
| 41 |
|
| 42 |
## AZURE LOGGING - DEPRECATED
|
|
|
|
| 7 |
import pandas as pd
|
| 8 |
import io
|
| 9 |
from typing import TypedDict, List
|
| 10 |
+
from climateqa.constants import DOCUMENT_METADATA_DEFAULT_VALUES
|
| 11 |
|
| 12 |
|
| 13 |
def serialize_docs(docs:list)->list:
|
|
|
|
| 25 |
"""
|
| 26 |
new_docs = []
|
| 27 |
for doc in docs:
|
| 28 |
+
# Make sure we have a clean doc format
|
| 29 |
+
new_doc = {
|
| 30 |
+
"page_content": doc.get("page_content", ""),
|
| 31 |
+
"metadata": {}
|
| 32 |
+
}
|
| 33 |
|
| 34 |
+
# Ensure all metadata fields exist with defaults if missing
|
|
|
|
|
|
|
|
|
|
| 35 |
for field, default_value in DOCUMENT_METADATA_DEFAULT_VALUES.items():
|
| 36 |
+
new_value = (doc.get("metadata", {}).get(field, default_value))
|
| 37 |
+
try:
|
| 38 |
+
new_doc["metadata"][field] = type(default_value)(new_value)
|
| 39 |
+
except:
|
| 40 |
+
new_doc["metadata"][field] = default_value
|
| 41 |
+
|
| 42 |
new_docs.append(new_doc)
|
| 43 |
+
|
| 44 |
+
if new_docs == []:
|
| 45 |
+
new_docs = [{"page_content": "No documents found", "metadata": DOCUMENT_METADATA_DEFAULT_VALUES}]
|
| 46 |
return new_docs
|
| 47 |
|
| 48 |
## AZURE LOGGING - DEPRECATED
|