HugoLaurencon HF staff committed on
Commit
22701ae
1 Parent(s): c340078

correction of bug

Browse files
Files changed (1) hide show
  1. app.py +8 -6
app.py CHANGED
@@ -131,18 +131,20 @@ class Visualization:
131
  else 0
132
  )
133
  label_selectbox = (
134
- "Length of the repetitions (that will determine the repetitions ratio). "
135
- "Choosing a higher or lower number does not mean that the filtering "
136
- "is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
137
- "tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
138
- "few or no repetitions, simply because their length gives them more diversity, and we do "
139
- "not want to discard such documents."
140
  )
141
  repetitions_length = st.sidebar.selectbox(
142
  label=label_selectbox,
143
  options=val_repetitions_lengths,
144
  index=default_index,
145
  )
 
 
 
 
 
 
 
146
  self.docs = self.docs_checkpoint
147
  for i in range(len(self.docs["repetitions_ratio"])):
148
  self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]
131
  else 0
132
  )
133
  label_selectbox = (
134
+ "Length of the repetitions (that will determine the repetitions ratio)."
 
 
 
 
 
135
  )
136
  repetitions_length = st.sidebar.selectbox(
137
  label=label_selectbox,
138
  options=val_repetitions_lengths,
139
  index=default_index,
140
  )
141
+ st.sidebar.caption(
142
+ "Choosing a higher or lower number does not mean that the filtering "
143
+ "is stronger or weaker. Be careful, choosing a low number (below 5 for languages like English) "
144
+ "tends to associate a high repetitions ratio to very long documents (like book chapters), but with "
145
+ "few or no repetitions, simply because their length gives them more diversity, and we do "
146
+ "not want to discard such documents."
147
+ )
148
  self.docs = self.docs_checkpoint
149
  for i in range(len(self.docs["repetitions_ratio"])):
150
  self.docs["repetitions_ratio"].iloc[i] = self.docs["repetitions_ratio"].iloc[i][repetitions_length]