Spaces:
Runtime error
Runtime error
Commit
·
22701ae
1
Parent(s):
c340078
correction of bug
Browse files
app.py
CHANGED
|
@@ -131,18 +131,20 @@ class Visualization:
|
|
| 131 |
else 0
|
| 132 |
)
|
| 133 |
label_selectbox = (
|
| 134 |
-
"Length of the repetitions (that will determine the repetitions ratio).
|
| 135 |
-
"Choosing a higher or lower number does not mean that the filtering "
|
| 136 |
-
"is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
|
| 137 |
-
"tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
|
| 138 |
-
"few or no repetitions, simply because their length gives them more diversity, and we do "
|
| 139 |
-
"not want to discard such documents."
|
| 140 |
)
|
| 141 |
repetitions_length = st.sidebar.selectbox(
|
| 142 |
label=label_selectbox,
|
| 143 |
options=val_repetitions_lengths,
|
| 144 |
index=default_index,
|
| 145 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 146 |
self.docs = self.docs_checkpoint
|
| 147 |
for i in range(len(self.docs["repetitions_ratio"])):
|
| 148 |
self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]
|
|
|
|
| 131 |
else 0
|
| 132 |
)
|
| 133 |
label_selectbox = (
|
| 134 |
+
"Length of the repetitions (that will determine the repetitions ratio)."
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 135 |
)
|
| 136 |
repetitions_length = st.sidebar.selectbox(
|
| 137 |
label=label_selectbox,
|
| 138 |
options=val_repetitions_lengths,
|
| 139 |
index=default_index,
|
| 140 |
)
|
| 141 |
+
st.sidebar.caption(
|
| 142 |
+
"Choosing a higher or lower number does not mean that the filtering "
|
| 143 |
+
"is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
|
| 144 |
+
"tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
|
| 145 |
+
"few or no repetitions, simply because their length gives them more diversity, and we do "
|
| 146 |
+
"not want to discard such documents."
|
| 147 |
+
)
|
| 148 |
self.docs = self.docs_checkpoint
|
| 149 |
for i in range(len(self.docs["repetitions_ratio"])):
|
| 150 |
self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]
|