Spaces:

lfoppiano
/

document-qa

Running

App Files Files Community

lfoppiano committed on Jan 20, 2024

Commit

66819b5

1 Parent(s): c07b97b

fix coordinates colors when working with chunks

Browse files

Files changed (2) hide show

document_qa/document_qa_engine.py +0 -2
streamlit_app.py +15 -10

document_qa/document_qa_engine.py CHANGED Viewed

@@ -63,8 +63,6 @@ class TextMerger:
                 new_coordinates.append(current_coordinates)
                 current_texts = []
                 current_coordinates = []
-            else:
-                print("bao")
         if len(current_texts) > 0:
             new_passages.append(current_texts)

                 new_coordinates.append(current_coordinates)
                 current_texts = []
                 current_coordinates = []
         if len(current_texts) > 0:
             new_passages.append(current_texts)

streamlit_app.py CHANGED Viewed

@@ -430,16 +430,14 @@ with right_column:
                 _, text_response, coordinates = st.session_state['rqa'][model].query_document(question,
                                                                                               st.session_state.doc_id,
                                                                                               context_size=context_size)
-                annotations = [
-                    GrobidAggregationProcessor.box_to_dict(coo) for coo in [c.split(",") for coord in
-                                                                            coordinates for c in coord]
-                ]
                 gradients = generate_color_gradient(len(annotations))
                 for i, color in enumerate(gradients):
-                    annotations[i]['color'] = color
-                st.session_state['annotations'] = annotations
-                # with left_column:
-                #     pdf_viewer(input=st.session_state['binary'], annotations=st.session_state['annotations'], key=1)
         if not text_response:
             st.error("Something went wrong. Contact Luca Foppiano (Foppiano.Luca@nims.co.jp) to report the issue.")
@@ -470,7 +468,14 @@ with right_column:
 with left_column:
     if st.session_state['binary']:
         if st.session_state['should_show_annotations']:
-            pdf_viewer(input=st.session_state['binary'], width=600, height=800,
                        annotations=st.session_state['annotations'])
         else:
-            pdf_viewer(input=st.session_state['binary'], width=600, height=800)

                 _, text_response, coordinates = st.session_state['rqa'][model].query_document(question,
                                                                                               st.session_state.doc_id,
                                                                                               context_size=context_size)
+                annotations = [[GrobidAggregationProcessor.box_to_dict([cs for cs in c.split(",")]) for c in coord_doc]
+                               for coord_doc in coordinates]
                 gradients = generate_color_gradient(len(annotations))
                 for i, color in enumerate(gradients):
+                    for annotation in annotations[i]:
+                        annotation['color'] = color
+                st.session_state['annotations'] = [annotation for annotation_doc in annotations for annotation in annotation_doc]
         if not text_response:
             st.error("Something went wrong. Contact Luca Foppiano (Foppiano.Luca@nims.co.jp) to report the issue.")
 with left_column:
     if st.session_state['binary']:
         if st.session_state['should_show_annotations']:
+            pdf_viewer(input=st.session_state['binary'],
+                       width=600,
+                       height=800,
+                       annotation_outline_size=2,
                        annotations=st.session_state['annotations'])
         else:
+            pdf_viewer(input=st.session_state['binary'],
+                       width=600,
+                       height=800,
+                       annotation_outline_size=2
+                       )