correct logs formatting for dataviewer
Browse files
- climateqa/constants.py +1 -1
- climateqa/logging.py +16 -10
    	
        climateqa/constants.py
    CHANGED
    
    | @@ -97,7 +97,7 @@ DOCUMENT_METADATA_DEFAULT_VALUES = { | |
| 97 | 
             
                "content": "",
         | 
| 98 | 
             
                "reranking_score": 0.0,
         | 
| 99 | 
             
                "query_used_for_retrieval": "",
         | 
| 100 | 
            -
                "sources_used": [],
         | 
| 101 | 
             
                "question_used": "",
         | 
| 102 | 
             
                "index_used": ""
         | 
| 103 | 
             
            }
         | 
|  | |
| 97 | 
             
                "content": "",
         | 
| 98 | 
             
                "reranking_score": 0.0,
         | 
| 99 | 
             
                "query_used_for_retrieval": "",
         | 
| 100 | 
            +
                "sources_used": [""],
         | 
| 101 | 
             
                "question_used": "",
         | 
| 102 | 
             
                "index_used": ""
         | 
| 103 | 
             
            }
         | 
    	
        climateqa/logging.py
    CHANGED
    
    | @@ -7,7 +7,7 @@ import csv | |
| 7 | 
             
            import pandas as pd
         | 
| 8 | 
             
            import io
         | 
| 9 | 
             
            from typing import TypedDict, List
         | 
| 10 | 
            -
            from constants import DOCUMENT_METADATA_DEFAULT_VALUES
         | 
| 11 |  | 
| 12 |  | 
| 13 | 
             
            def serialize_docs(docs:list)->list:
         | 
| @@ -25,18 +25,24 @@ def serialize_docs(docs:list)->list: | |
| 25 | 
             
                """
         | 
| 26 | 
             
                new_docs = []
         | 
| 27 | 
             
                for doc in docs:
         | 
| 28 | 
            -
                     | 
| 29 | 
            -
                    new_doc | 
| 30 | 
            -
             | 
|  | |
|  | |
| 31 |  | 
| 32 | 
            -
                    #  | 
| 33 | 
            -
             | 
| 34 | 
            -
                    
         | 
| 35 | 
            -
                    # Copy each metadata field, using default if missing
         | 
| 36 | 
             
                    for field, default_value in DOCUMENT_METADATA_DEFAULT_VALUES.items():
         | 
| 37 | 
            -
                         | 
| 38 | 
            -
                        
         | 
|  | |
|  | |
|  | |
|  | |
| 39 | 
             
                    new_docs.append(new_doc)
         | 
|  | |
|  | |
|  | |
| 40 | 
             
                return new_docs
         | 
| 41 |  | 
| 42 | 
             
            ## AZURE LOGGING - DEPRECATED
         | 
|  | |
| 7 | 
             
            import pandas as pd
         | 
| 8 | 
             
            import io
         | 
| 9 | 
             
            from typing import TypedDict, List
         | 
| 10 | 
            +
            from climateqa.constants import DOCUMENT_METADATA_DEFAULT_VALUES
         | 
| 11 |  | 
| 12 |  | 
| 13 | 
             
            def serialize_docs(docs:list)->list:
         | 
|  | |
| 25 | 
             
                """
         | 
| 26 | 
             
                new_docs = []
         | 
| 27 | 
             
                for doc in docs:
         | 
| 28 | 
            +
                    # Make sure we have a clean doc format
         | 
| 29 | 
            +
                    new_doc = {
         | 
| 30 | 
            +
                        "page_content": doc.get("page_content", ""),
         | 
| 31 | 
            +
                        "metadata": {}
         | 
| 32 | 
            +
                    }
         | 
| 33 |  | 
| 34 | 
            +
                    # Ensure all metadata fields exist with defaults if missing
         | 
|  | |
|  | |
|  | |
| 35 | 
             
                    for field, default_value in DOCUMENT_METADATA_DEFAULT_VALUES.items():
         | 
| 36 | 
            +
                        new_value =  (doc.get("metadata", {}).get(field, default_value))
         | 
| 37 | 
            +
                        try:
         | 
| 38 | 
            +
                            new_doc["metadata"][field] = type(default_value)(new_value)
         | 
| 39 | 
            +
                        except:
         | 
| 40 | 
            +
                            new_doc["metadata"][field] = default_value
         | 
| 41 | 
            +
             | 
| 42 | 
             
                    new_docs.append(new_doc)
         | 
| 43 | 
            +
                    
         | 
| 44 | 
            +
                if new_docs == []:
         | 
| 45 | 
            +
                    new_docs = [{"page_content": "No documents found", "metadata": DOCUMENT_METADATA_DEFAULT_VALUES}]
         | 
| 46 | 
             
                return new_docs
         | 
| 47 |  | 
| 48 | 
             
            ## AZURE LOGGING - DEPRECATED
         | 

