Spaces:

pleonova
/

multi-label-summary-text

Running

App Files Community

Paula Leonova committed on Feb 16, 2022

Commit

c0937ef

1 Parent(s): 43481f8

Update how ground truth label is uploaded for multiple texts

Browse files

Files changed (1) hide show

app.py +21 -15

app.py CHANGED Viewed

@@ -81,16 +81,16 @@ with st.form(key='my_form'):
     glabels = list(set([x.strip() for x in glabels.strip().split(',') if len(x.strip()) > 0]))
-    # glabels_csv_expander = st.expander(label=f'Have a file with labels for the text? Click here to upload your CSV file.', expanded=False)
-    # with glabels_csv_expander:
-    #     st.markdown('##### Choose one of the options below:')
-    #     st.write("__Option A:__")
-    #     uploaded_onetext_glabels_file = st.file_uploader("Single Text: Choose a CSV file with one column and no header, where each cell is a separate label",
-    #                                                      key = 'onetext_glabels_uploader')
-    #     st.write("__Option B:__")
-    #     uploaded_multitext_glabels_file = st.file_uploader('Multiple Text: Choose a CSV file with two columns "title" and "label", with the cells in the title column matching the name of the files uploaded in step #1.',
-    #                                                        key = 'multitext_glabels_uploader')
-    #
     # threshold_value = st.slider(
@@ -280,12 +280,19 @@ if submit_button or example_button:
             else:
                 label_match_df = labels_full_df.copy()
-            # TO DO: ADD Flexibility for csv import and multiple texts
             if len(glabels) > 0:
                 gdata = pd.DataFrame({'label': glabels})
                 gdata['correct_match'] = True
-                label_match_df = pd.merge(label_match_df, gdata, how = 'left', on = ['label'])
                 label_match_df['correct_match'].fillna(False, inplace=True)
             st.dataframe(label_match_df)
@@ -296,7 +303,6 @@ if submit_button or example_button:
                 mime='title_label_sum_full/csv',
             )
             # if len(glabels) > 0:
             #     st.markdown("### Evaluation Metrics")
             #     with st.spinner('Evaluating output against ground truth...'):
@@ -313,4 +319,4 @@ if submit_button or example_button:
             #             st.dataframe(df_report)
         st.success('All done!')
-        # st.balloons()

     glabels = list(set([x.strip() for x in glabels.strip().split(',') if len(x.strip()) > 0]))
+    glabels_csv_expander = st.expander(label=f'Have a file with labels for the text? Click here to upload your CSV file.', expanded=False)
+    with glabels_csv_expander:
+        st.markdown('##### Choose one of the options below:')
+        st.write("__Option A:__")
+        uploaded_onetext_glabels_file = st.file_uploader("Single Text: Choose a CSV file with one column and no header, where each cell is a separate label",
+                                                         key = 'onetext_glabels_uploader')
+        st.write("__Option B:__")
+        uploaded_multitext_glabels_file = st.file_uploader('Multiple Text: Choose a CSV file with two columns "title" and "label", with the cells in the title column matching the name of the files uploaded in step #1.',
+                                                           key = 'multitext_glabels_uploader')
     # threshold_value = st.slider(
             else:
                 label_match_df = labels_full_df.copy()
             if len(glabels) > 0:
                 gdata = pd.DataFrame({'label': glabels})
+                join_list = ['label']
+            elif uploaded_onetext_glabels_file is not None:
+                gdata = pd.read_csv(uploaded_onetext_glabels_file, header=None)
+                join_list = ['label']
+            elif uploaded_multitext_glabels_file is not None:
+                gdata = pd.read_csv(uploaded_multitext_glabels_file)
+                join_list = ['title', 'label']
+            if len(glabels) > 0 or uploaded_onetext_glabels_file is not None or uploaded_multitext_glabels_file is not None:
                 gdata['correct_match'] = True
+                label_match_df = pd.merge(label_match_df, gdata, how='outer', on=join_list)
                 label_match_df['correct_match'].fillna(False, inplace=True)
             st.dataframe(label_match_df)
                 mime='title_label_sum_full/csv',
             )
             # if len(glabels) > 0:
             #     st.markdown("### Evaluation Metrics")
             #     with st.spinner('Evaluating output against ground truth...'):
             #             st.dataframe(df_report)
         st.success('All done!')
+        st.balloons()