HugoLaurencon
committed on
Commit
•
22701ae
1
Parent(s):
c340078
correction of bug
Browse files
app.py
CHANGED
@@ -131,18 +131,20 @@ class Visualization:
|
|
131 |
else 0
|
132 |
)
|
133 |
label_selectbox = (
|
134 |
-
"Length of the repetitions (that will determine the repetitions ratio).
|
135 |
-
"Choosing a higher or lower number does not mean that the filtering "
|
136 |
-
"is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
|
137 |
-
"tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
|
138 |
-
"few or no repetitions, simply because their length gives them more diversity, and we do "
|
139 |
-
"not want to discard such documents."
|
140 |
)
|
141 |
repetitions_length = st.sidebar.selectbox(
|
142 |
label=label_selectbox,
|
143 |
options=val_repetitions_lengths,
|
144 |
index=default_index,
|
145 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
146 |
self.docs = self.docs_checkpoint
|
147 |
for i in range(len(self.docs["repetitions_ratio"])):
|
148 |
self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]
|
|
|
131 |
else 0
|
132 |
)
|
133 |
label_selectbox = (
|
134 |
+
"Length of the repetitions (that will determine the repetitions ratio)."
|
|
|
|
|
|
|
|
|
|
|
135 |
)
|
136 |
repetitions_length = st.sidebar.selectbox(
|
137 |
label=label_selectbox,
|
138 |
options=val_repetitions_lengths,
|
139 |
index=default_index,
|
140 |
)
|
141 |
+
st.sidebar.caption(
|
142 |
+
"Choosing a higher or lower number does not mean that the filtering "
|
143 |
+
"is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
|
144 |
+
"tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
|
145 |
+
"few or no repetitions, simply because their length gives them more diversity, and we do "
|
146 |
+
"not want to discard such documents."
|
147 |
+
)
|
148 |
self.docs = self.docs_checkpoint
|
149 |
for i in range(len(self.docs["repetitions_ratio"])):
|
150 |
self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]
|