myquyen242 commited on
Commit
5df90c0
โ€ข
1 Parent(s): cc8d643

Upload 13 files

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ final_image_6.jpg filter=lfs diff=lfs merge=lfs -text
app(1).py ADDED
@@ -0,0 +1,96 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import streamlit as st
2
+ import pandas as pd
3
+ import matplotlib.pyplot as plt
4
+ import pandas_bokeh
5
+
6
+
7
+ # ๊ธ€ ์“ฐ๊ธฐ(๋งํฌ ์‚ฝ์ž…)
8
+ st.title('VIETNAM DONGDAEMUN FOOOOOOOOOD!!!!!!!!!')
9
+
10
+ st.header('Selection of Vietnamese Restaurants in Dongdaemun Area')
11
+ st.subheader('Variety of dishes from different region in Vietnam, made affordable and delicious for local taste')
12
+ st.subheader('Items such as Pho Soup, Bun Bo Hue, Cha Gio or Com Chien')
13
+ st.write('''Write something here about the booming of Vietnamese Restaurant in Korea - particularly the fast growing food scene in Dongdaemun [ํ‘ธ๋“œํŠธ๋Ÿญ](https://namu.wiki/w/%EB%B2%A0%ED%8A%B8%EB%82%A8%20%EC%9A%94%EB%A6%AC)
14
+ .''' )
15
+
16
+ # ์‚ฌ์ง„ ์‚ฝ์ž…
17
+ st.image('/content/drive/MyDrive/DATA JOURNALISM/final - may31/final_image_2.jpg', caption='A Spread of Vietnamese Dishes You Might Be Able To Find')
18
+
19
+ st.image('/content/drive/MyDrive/DATA JOURNALISM/final - may31/final_image_4.jpg', caption='A popular choice everywhere: Vietnamese Pho Soup')
20
+
21
+ st.image('/content/drive/MyDrive/DATA JOURNALISM/final - may31/final_image_3.jpg', caption='Hidden Gem: Banh Xeo')
22
+
23
+
24
+ st.header('Cheap and Delicious: One can find a variety of Vietnamese Restaurant in Dongdaemun Area')
25
+ st.subheader('Hosting dishes from North to South Vietnam')
26
+ st.subheader('The almost infinite choices will leave you looking for reviews!')
27
+ st.write('''Before deciding on which dish you'd want ~ carefully browse through the Blog section for an intimate look at the local food joints''' )
28
+
29
+ # ๋ฐ์ดํ„ฐ ๋ณด์—ฌ์ฃผ๊ธฐ
30
+ df_แ„€แ…งแ†ผแ„’แ…ดแ„ƒแ…ขแ„†แ…กแ†บแ„Œแ…ตแ†ธ = pd.read_excel('/content/drive/MyDrive/DATA JOURNALISM/final - may31/vietnam_food_dongdaemun_BLOGS.xlsx', index_col=0)
31
+ st.write('We have narrowed down to 150 most relevant blogs!!', df_แ„€แ…งแ†ผแ„’แ…ดแ„ƒแ…ขแ„†แ…กแ†บแ„Œแ…ตแ†ธ)
32
+
33
+ df_แ„€แ…งแ†ผแ„’แ…ดแ„ƒแ…ขแ„†แ…กแ†บแ„Œแ…ตแ†ธ_keyword = pd.read_excel('/content/drive/MyDrive/DATA JOURNALISM/final - may31/vietnam_food_KEYWORDS.xlsx', index_col=0)
34
+ st.write('๋ธ”๋กœ๊ทธ ๊ธ€์—์„œ ๊ฐ€์žฅ ๋งŽ์ด ์ถœํ˜„ํ•œ ๋‹จ์–ด๋Š” ~~~ ์„ค๋ช…~~~', df_แ„€แ…งแ†ผแ„’แ…ดแ„ƒแ…ขแ„†แ…กแ†บแ„Œแ…ตแ†ธ_keyword)
35
+
36
+
37
+
38
+ # ์›Œ๋“œํด๋ผ์šฐ๋“œ - WORDCLOUD
39
+ st.write('์ฃผ์š” ๋‹จ์–ด๋“ค์„ ์›Œ๋“œํด๋ผ์šฐ๋“œ๋กœ ๋ณด์—ฌ์ฃผ๋ฉด ๋‹ค์Œ๊ณผ ๊ฐ™๋‹ค')
40
+ st.image('/content/drive/MyDrive/DATA JOURNALISM/final - may31/final_WORDCLOUD.png')
41
+
42
+
43
+
44
+ # ์—ฐ๊ฒฐ๋ง ๋ถ„์„ - NETWORK
45
+ st.write('''์ทจ์žฌํŒ€์€ ์ฃผ์š” ๋‹จ์–ด๋“ค ๊ฐ„์— ๊ณต๋™์ถœํ˜„ํ•˜๋Š” ๊ด€๊ณ„๋ฅผ ๋ฐ”ํƒ•์œผ๋กœ ์˜๋ฏธ์—ฐ๊ฒฐ๋ง์„ ๊ทธ๋ ค๋ณด์•˜๋‹ค.
46
+ ๋ถ„์„๊ฒฐ๊ณผ, ~~์„ค๋ช…~~''')
47
+ st.image('/content/drive/MyDrive/DATA JOURNALISM/final - may31/final_NETWORK.png')
48
+
49
+ #### The Section Below Is Extra Stuff We Gotta Think About
50
+ '''
51
+ #
52
+ df_๊ตํ†ต์‚ฌ๊ณ  = pd.read_excel('/content/drive/MyDrive/2024_1_class/data_jour/data_traffic_accidents.xlsx', index_col=0)
53
+ st.write('๋‹ค์Œ ๋ฐ์ดํ„ฐ๋Š” ์ „๊ตญ์˜ ๊ตํ†ต์‚ฌ๊ณ ๋ฅผ ์ง€์—ญ๋ณ„๋กœ ์ง‘๊ณ„ํ•œ ๊ฒƒ์ด๋‹ค', df_๊ตํ†ต์‚ฌ๊ณ )
54
+
55
+ # ๊ฒ€์ƒ‰์–ด ์ž…๋ ฅ ๋ฐ›์•„ ์ถœ๋ ฅ
56
+ query = st.text_input('์ด ๊ณณ์— ์ง€์—ญ๋ช…(์‹œ๊ตฐ๊ตฌ๋™์๋ฉด)์„ ์ž…๋ ฅํ•˜๋ฉด ๊ด€๋ จ ๋ฐ์ดํ„ฐ๋งŒ ๊ฒ€์ƒ‰ํ•ด ๋ณด์—ฌ์ค๋‹ˆ๋‹ค', key='region1_input')
57
+ df_๊ตํ†ต์‚ฌ๊ณ ['select1']=df_๊ตํ†ต์‚ฌ๊ณ ['์‚ฌ๊ณ ์ง€์—ญ์œ„์น˜๋ช…'].apply(lambda x: 1 if query in x else 0)
58
+ st.write('๊ฒ€์ƒ‰ ๊ฒฐ๊ณผ:', df_๊ตํ†ต์‚ฌ๊ณ [df_๊ตํ†ต์‚ฌ๊ณ ['select1']==1])
59
+
60
+ # ๊ตํ†ต์‚ฌ๊ณ  ์œ ํ˜•๊ณผ ์—ฐ๋„์— ๋”ฐ๋ฅธ pivot table ๋ณด์—ฌ์ฃผ๊ธฐ
61
+ df_๊ตํ†ต์‚ฌ๊ณ _pivot=df_๊ตํ†ต์‚ฌ๊ณ .pivot_table(index='์‚ฌ๊ณ ์œ ํ˜•๊ตฌ๋ถ„', columns='์‚ฌ๊ณ ์—ฐ๋„', values='์‚ฌ๊ณ ๊ฑด์ˆ˜', aggfunc='sum')
62
+ df_๊ตํ†ต์‚ฌ๊ณ _heatmap=df_๊ตํ†ต์‚ฌ๊ณ _pivot.style.background_gradient(cmap='Oranges').format("{:.2f}")
63
+ st.write('๋‹ค์Œ ํ‘œ๋Š” ๊ตํ†ต์‚ฌ๊ณ  ๊ฑด์ˆ˜๋ฅผ ์œ ํ˜•๊ณผ ์—ฐ๋„์— ๋”ฐ๋ผ ๊ตฌ๋ถ„ํ•œ ๊ฒƒ์ด๋‹ค', df_๊ตํ†ต์‚ฌ๊ณ _heatmap)
64
+
65
+ # ๊ฒ€์ƒ‰์–ด ์ž…๋ ฅ ๋ฐ›์•„ pivot table ์ถœ๋ ฅ
66
+ query_pivot = st.text_input('์ด ๊ณณ์— ์ง€์—ญ๋ช…(์‹œ๊ตฐ๊ตฌ)์„ ์ž…๋ ฅํ•˜๋ฉด ๊ด€๋ จ ๋ฐ์ดํ„ฐ๋งŒ ๊ฒ€์ƒ‰ํ•ด ๋ณด์—ฌ์ค๋‹ˆ๋‹ค', key='region2_input')
67
+ df_๊ตํ†ต์‚ฌ๊ณ ['select2']=df_๊ตํ†ต์‚ฌ๊ณ ['์‚ฌ๊ณ ์ง€์—ญ์œ„์น˜๋ช…'].apply(lambda x: 1 if query_pivot in x else 0)
68
+ df_๊ตํ†ต์‚ฌ๊ณ _pivot_selected=df_๊ตํ†ต์‚ฌ๊ณ [df_๊ตํ†ต์‚ฌ๊ณ ['select2']==1].pivot_table(index='์‚ฌ๊ณ ์œ ํ˜•๊ตฌ๋ถ„', columns='์‚ฌ๊ณ ์—ฐ๋„', values='์‚ฌ๊ณ ๊ฑด์ˆ˜', aggfunc='sum')
69
+ df_๊ตํ†ต์‚ฌ๊ณ _heatmap_selected=df_๊ตํ†ต์‚ฌ๊ณ _pivot_selected.style.background_gradient(cmap='Oranges').format("{:.2f}")
70
+ st.write('๊ฒ€์ƒ‰ ๊ฒฐ๊ณผ:', df_๊ตํ†ต์‚ฌ๊ณ _heatmap_selected)
71
+
72
+ # pandas_bokeh ๊ทธ๋ž˜ํ”„ ๋ณด์—ฌ์ฃผ๊ธฐ
73
+ st.write('์ „๊ตญ ๊ตํ†ต์‚ฌ๊ณ  ๋ฐ์ดํ„ฐ์— ๋”ฐ๋ฅด๋ฉด, ์‚ฌ๊ณ ๊ฑด์ˆ˜์™€ ์ค‘์ƒ์ž์ˆ˜๋Š” ๋ฐ€์ ‘ํ•œ ๊ด€๋ จ์„ ๋งบ๊ณ  ์žˆ๋‹ค. ~~~์„ค๋ช…~~. *๊ทธ๋ž˜ํ”„ ๋‚ด ์ ์— ์ปค์„œ๋ฅผ ๋Œ€๋ฉด ์ง€์—ญ๋ช…์ด ๋‚˜ํƒ€๋‚œ๋‹ค')
74
+ p_scatter = df_๊ตํ†ต์‚ฌ๊ณ .plot_bokeh.scatter(
75
+ x="์‚ฌ๊ณ ๊ฑด์ˆ˜",
76
+ y="์ค‘์ƒ์ž์ˆ˜",
77
+ title="์‚ฌ๊ณ ๊ฑด์ˆ˜์™€ ์ค‘์ƒ์ž์ˆ˜",
78
+ size=10,
79
+ hovertool_string="""<h6>์œ„์น˜:@{์‚ฌ๊ณ ์ง€์—ญ์œ„์น˜๋ช…}</h6>"""
80
+ )
81
+ st.bokeh_chart(p_scatter, use_container_width=True)
82
+
83
+ # ์„ ํƒํ•œ ์กฐ๊ฑด์— ๋”ฐ๋ผ ์ถœ๋ ฅ
84
+ option = st.selectbox('์—ฐ๋„๋ฅผ ์„ ํƒํ•˜๋ฉด ํ•ด๋‹น ์‹œ๊ธฐ์˜ ๊ทธ๋ž˜ํ”„๋ฅผ ๋ณด์—ฌ์ค๋‹ˆ๋‹ค',
85
+ (2012, 2013, 2014, 2015, 2016, 2018, 2017, 2019, 2020, 2021), key='year_input')
86
+
87
+ p_scatter_selected = df_๊ตํ†ต์‚ฌ๊ณ [df_๊ตํ†ต์‚ฌ๊ณ ['์‚ฌ๊ณ ์—ฐ๋„']==option].plot_bokeh.scatter(
88
+ x="์‚ฌ๊ณ ๊ฑด์ˆ˜",
89
+ y="์ค‘์ƒ์ž์ˆ˜",
90
+ title="์‚ฌ๊ณ ๊ฑด์ˆ˜์™€ ์ค‘์ƒ์ž์ˆ˜",
91
+ size=10,
92
+ hovertool_string="""<h6>์œ„์น˜:@{์‚ฌ๊ณ ์ง€์—ญ์œ„์น˜๋ช…}</h6>"""
93
+ )
94
+ st.write('๊ฒ€์ƒ‰ ๊ฒฐ๊ณผ:')
95
+ st.bokeh_chart(p_scatter_selected, use_container_width=True)
96
+ '''
final_NETWORK.png ADDED
final_WORDCLOUD.png ADDED
final_image_1.jpg ADDED
final_image_2.jpg ADDED
final_image_3.jpg ADDED
final_image_4.jpg ADDED
final_image_5.jpg ADDED
final_image_6.jpg ADDED

Git LFS Details

  • SHA256: 9172102d4243c5f0c08ca250303ee3c23a10f8aa41f3fd9562c502b7c2345bfd
  • Pointer size: 132 Bytes
  • Size of remote file: 4.11 MB
pre_keywords.xlsx ADDED
Binary file (34.9 kB). View file
 
vietnam_food_KEYWORDS.xlsx ADDED
Binary file (10.9 kB). View file
 
vietnam_food_blog_NOUNS.xlsx ADDED
Binary file (60.4 kB). View file
 
vietnam_food_dongdaemun_BLOGS.xlsx ADDED
Binary file (28.7 kB). View file