Update app.py
Browse files
app.py
CHANGED
@@ -191,16 +191,17 @@ if not USE_CACHE:
|
|
191 |
if LIMIT is not None:
|
192 |
print(f"LIMIT: {LIMIT}")
|
193 |
|
194 |
-
# digest store
|
195 |
digests = dict() # key is cluster, value is digestor object
|
196 |
-
out_dicts = []
|
197 |
# list to accept user choices
|
198 |
# retrieve cluster data and create dict to track each article (articleStubs)
|
199 |
# and create topic clusters by performing ner.
|
200 |
print("Initializing....")
|
201 |
article_dict, clusters = initialize(LIMIT, USE_CACHE)
|
202 |
-
# We now have clusters and cluster data. Redundancy
|
203 |
-
|
|
|
204 |
st.title("Welcome to TopicDig!")
|
205 |
st.success(f"You select the topics, we summarize the relevant news and show you a digest, plus some info to help contextualize what the machine did.")
|
206 |
|
@@ -209,6 +210,7 @@ st.warning("Enjoy, and remember, these summaries contain a few kinds of issues,
|
|
209 |
st.subheader(f"How it works:")
|
210 |
st.write(f"""Select 1 to 3 topics from the drop down menus and click 'submit' to start generating your digest!""")
|
211 |
|
|
|
212 |
with st.expander("See extra options"):
|
213 |
st.subheader("Refresh topics: ")
|
214 |
st.write("You may want to refresh the topic lists if the app loaded several hours ago or you get no summary.")
|
@@ -225,27 +227,19 @@ selections = []
|
|
225 |
choices = list(clusters.keys())
|
226 |
choices.insert(0,'None')
|
227 |
|
|
|
228 |
# st.write(f"CNN articles: {st.session_state['cnn']}")
|
229 |
# st.write(f"NPR articles: {st.session_state['npr']}")
|
230 |
# st.write(f"Number of clusters {st.session_state['num_clusters']}")
|
231 |
|
232 |
-
|
233 |
st.sidebar.subheader("Topics")
|
234 |
show_clusters = {i:len(clusters[i]) for i in clusters.keys()}
|
235 |
cdf = pd.DataFrame(data={"Articles":list(show_clusters.values()), "Cluster":list(show_clusters.keys())} )
|
236 |
styler = cdf.style.hide_index()
|
237 |
-
st.write(styler.to_html(), unsafe_allow_html=True)
|
238 |
-
|
239 |
-
#st.write(df.to_html(index=False), unsafe_allow_html=True)
|
240 |
-
st.sidebar.table(styler)
|
241 |
-
|
242 |
-
|
243 |
-
"""
|
244 |
-
show_clusters.sort(key=lambda x: len(x[1]), reverse=True)
|
245 |
-
for i in show_clusters:
|
246 |
-
st.sidebar.write(f"{i[0]} : {len(i[1])}")
|
247 |
-
"""
|
248 |
|
|
|
249 |
st.session_state['dt'] = dt.now()
|
250 |
# Form used to take 3 menu inputs
|
251 |
with st.form(key='columns_in_form'):
|
|
|
191 |
if LIMIT is not None:
|
192 |
print(f"LIMIT: {LIMIT}")
|
193 |
|
194 |
+
# Digest store. TODO: confirm whether this is still used - April 15, 2022
|
195 |
digests = dict() # key is cluster, value is digestor object
|
196 |
+
out_dicts = [] # Am I using this? -dit
|
197 |
# list to accept user choices
|
198 |
# retrieve cluster data and create dict to track each article (articleStubs)
|
199 |
# and create topic clusters by performing ner.
|
200 |
print("Initializing....")
|
201 |
article_dict, clusters = initialize(LIMIT, USE_CACHE)
|
202 |
+
# We now have clusters and cluster data. Redundancy?
|
203 |
+
|
204 |
+
# Welcome and explainer
|
205 |
st.title("Welcome to TopicDig!")
|
206 |
st.success(f"You select the topics, we summarize the relevant news and show you a digest, plus some info to help contextualize what the machine did.")
|
207 |
|
|
|
210 |
st.subheader(f"How it works:")
|
211 |
st.write(f"""Select 1 to 3 topics from the drop down menus and click 'submit' to start generating your digest!""")
|
212 |
|
213 |
+
# Expandable container for the refresh control and summarization parameters (currently only chunk size)
|
214 |
with st.expander("See extra options"):
|
215 |
st.subheader("Refresh topics: ")
|
216 |
st.write("You may want to refresh the topic lists if the app loaded several hours ago or you get no summary.")
|
|
|
227 |
choices = list(clusters.keys())
|
228 |
choices.insert(0,'None')
|
229 |
|
230 |
+
# The commented-out article/cluster counts below may be wanted in the sidebar - April 15, 2022
|
231 |
# st.write(f"CNN articles: {st.session_state['cnn']}")
|
232 |
# st.write(f"NPR articles: {st.session_state['npr']}")
|
233 |
# st.write(f"Number of clusters {st.session_state['num_clusters']}")
|
234 |
|
235 |
+
# Display the topics to the user (currently in the sidebar) - April 15, 2022
|
236 |
st.sidebar.subheader("Topics")
|
237 |
show_clusters = {i:len(clusters[i]) for i in clusters.keys()}
|
238 |
cdf = pd.DataFrame(data={"Articles":list(show_clusters.values()), "Cluster":list(show_clusters.keys())} )
|
239 |
styler = cdf.style.hide_index()
|
240 |
+
st.sidebar.write(styler.to_html(), unsafe_allow_html=True)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
241 |
|
242 |
+
# Get session time
|
243 |
st.session_state['dt'] = dt.now()
|
244 |
# Form used to take 3 menu inputs
|
245 |
with st.form(key='columns_in_form'):
|