snoop2head commited on
Commit
849819f
โ€ข
1 Parent(s): 498ff0a

upload post processing

Browse files
Files changed (1) hide show
  1. app.py +38 -6
app.py CHANGED
@@ -25,7 +25,7 @@ model = load_model("QuoQA-NLP/konec-privacy")
25
  model.eval()
26
 
27
 
28
- default_value = "์„ฑ์šฑ๋‹˜, ๋‹น๋‡จ ๊ฒ€์‚ฌํ•œ ๊ฑฐ ๊ฒฐ๊ณผ ๋‚˜์˜ค์…จ์–ด์š”."
29
 
30
  src_text = st.text_area(
31
  "๊ฒ€์‚ฌํ•˜๊ณ  ์‹ถ์€ ๋ฌธ์žฅ์„ ์ž…๋ ฅํ•˜์„ธ์š”.",
@@ -74,10 +74,10 @@ def yield_df(default_value):
74
  print(class_decoded)
75
 
76
  label_map = {
77
- "ADD": 0,
78
  "DN": "์งˆํ™˜ ์ •๋ณด",
79
  "DT": "๋‚ ์งœ ์ •๋ณด",
80
- "LC": "์ฃผ์†Œ ์ •๋ณด(์ง€์—ญ, ์ด๋ฉ”์ผ ์ฃผ์†Œ ๋“ฑ)",
81
  "OG": "๊ธฐ๊ด€ ์ •๋ณด",
82
  "PS": "์ธ๋ช…/๋ณ„๋ช… ์ •๋ณด",
83
  "QT": "์ˆ˜๋Ÿ‰ ์ •๋ณด",
@@ -85,6 +85,7 @@ def yield_df(default_value):
85
  "O": "๋น„๋ฏผ๊ฐ ์ •๋ณด"
86
  }
87
 
 
88
  # pair tokens with prediction
89
  tokenized_text = tokenizer.convert_ids_to_tokens(tokenized)
90
  list_result = []
@@ -99,7 +100,6 @@ def yield_df(default_value):
99
  df = pd.DataFrame(list_result)
100
  # remove first and last row
101
  df = df.iloc[1:-1]
102
- st.table(df)
103
  return df
104
 
105
  def convert_df(df:pd.DataFrame):
@@ -113,15 +113,45 @@ def convert_json(df:pd.DataFrame):
113
  return json_string
114
 
115
 
 
 
 
 
 
 
 
 
 
 
 
 
 
116
  if src_text == "":
117
  st.warning("Please **enter text** for translation")
118
  else:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
119
  st.markdown("### ๋ถ„๋ฅ˜๋œ ๋‹จ์–ด๋“ค")
120
  st.header("")
121
  cs, c1, c2, c3, cLast = st.columns([0.75, 1.5, 1.5, 1.5, 0.75])
122
 
123
- df_result = yield_df(src_text)
124
-
125
  with c1:
126
  #csvbutton = download_button(results, "results.csv", "๐Ÿ“ฅ Download .csv")
127
  csvbutton = st.download_button(label="๐Ÿ“ฅ csv๋กœ ๋‹ค์šด๋กœ๋“œ", data=convert_df(df_result), file_name= "results.csv", mime='text/csv', key='csv')
@@ -132,6 +162,8 @@ else:
132
  #jsonbutton = download_button(results, "results.json", "๐Ÿ“ฅ Download .json")
133
  jsonbutton = st.download_button(label="๐Ÿ“ฅ json์œผ๋กœ ๋‹ค์šด๋กœ๋“œ", data=convert_json(df_result), file_name= "results.json", mime='application/json', key='json')
134
 
 
 
135
  with st.expander("(์ฃผ) ์ฟผ์นด์—์ด์•„์ด ๋ฐ๋ชจ ์‚ฌ์‚ฌ ๊ด€๋ จ", expanded=True):
136
 
137
  st.write(
 
25
  model.eval()
26
 
27
 
28
+ default_value = "์˜์ง„๋‹˜, ๋‹น๋‡จ ๊ฒ€์‚ฌํ•œ ๊ฑฐ ๊ฒฐ๊ณผ ๋‚˜์˜ค์…จ์–ด์š”."
29
 
30
  src_text = st.text_area(
31
  "๊ฒ€์‚ฌํ•˜๊ณ  ์‹ถ์€ ๋ฌธ์žฅ์„ ์ž…๋ ฅํ•˜์„ธ์š”.",
 
74
  print(class_decoded)
75
 
76
  label_map = {
77
+ "ADD": "์ฃผ์†Œ ์ •๋ณด",
78
  "DN": "์งˆํ™˜ ์ •๋ณด",
79
  "DT": "๋‚ ์งœ ์ •๋ณด",
80
+ "LC": "์žฅ์†Œ ์ •๋ณด",
81
  "OG": "๊ธฐ๊ด€ ์ •๋ณด",
82
  "PS": "์ธ๋ช…/๋ณ„๋ช… ์ •๋ณด",
83
  "QT": "์ˆ˜๋Ÿ‰ ์ •๋ณด",
 
85
  "O": "๋น„๋ฏผ๊ฐ ์ •๋ณด"
86
  }
87
 
88
+
89
  # pair tokens with prediction
90
  tokenized_text = tokenizer.convert_ids_to_tokens(tokenized)
91
  list_result = []
 
100
  df = pd.DataFrame(list_result)
101
  # remove first and last row
102
  df = df.iloc[1:-1]
 
103
  return df
104
 
105
  def convert_df(df:pd.DataFrame):
 
113
  return json_string
114
 
115
 
116
+
117
+ filtering_map = {
118
+ "์ฃผ์†Œ ์ •๋ณด": "[์ฃผ์†Œ]",
119
+ "์งˆํ™˜ ์ •๋ณด": "[์งˆํ™˜]",
120
+ "๋‚ ์งœ ์ •๋ณด": "[๋‚ ์งœ]",
121
+ "์žฅ์†Œ ์ •๋ณด": "[์žฅ์†Œ]",
122
+ "๊ธฐ๊ด€ ์ •๋ณด": "[๊ธฐ๊ด€]",
123
+ "์ธ๋ช…/๋ณ„๋ช… ์ •๋ณด": "[์ด๋ฆ„]",
124
+ "์ˆ˜๋Ÿ‰ ์ •๋ณด": "[์ˆ˜๋Ÿ‰]",
125
+ "๊ด€๊ณ„ ์ •๋ณด": "[๊ด€๊ณ„]",
126
+ "๋น„๋ฏผ๊ฐ ์ •๋ณด": "[๋น„๋ฏผ๊ฐ]"
127
+ }
128
+
129
  if src_text == "":
130
  st.warning("Please **enter text** for translation")
131
  else:
132
+ df_result = yield_df(src_text)
133
+ st.markdown("### ํ•„ํ„ฐ๋ง ๋œ ๋ฌธ์žฅ")
134
+
135
+ display_result = ""
136
+ for index, row in df_result.iterrows():
137
+ token_info = row["ํ˜•ํƒœ์†Œ"]
138
+ label_info = row["์˜ˆ์ƒ ๋ผ๋ฒจ"]
139
+ if label_info != "๋น„๋ฏผ๊ฐ ์ •๋ณด":
140
+ token_info = filtering_map[label_info]
141
+
142
+ if "##" in token_info:
143
+ token_info = token_info.replace("##", "")
144
+ else:
145
+ token_info = " " + token_info
146
+ display_result += token_info
147
+
148
+ st.write(display_result)
149
+
150
  st.markdown("### ๋ถ„๋ฅ˜๋œ ๋‹จ์–ด๋“ค")
151
  st.header("")
152
  cs, c1, c2, c3, cLast = st.columns([0.75, 1.5, 1.5, 1.5, 0.75])
153
 
154
+ st.table(df_result)
 
155
  with c1:
156
  #csvbutton = download_button(results, "results.csv", "๐Ÿ“ฅ Download .csv")
157
  csvbutton = st.download_button(label="๐Ÿ“ฅ csv๋กœ ๋‹ค์šด๋กœ๋“œ", data=convert_df(df_result), file_name= "results.csv", mime='text/csv', key='csv')
 
162
  #jsonbutton = download_button(results, "results.json", "๐Ÿ“ฅ Download .json")
163
  jsonbutton = st.download_button(label="๐Ÿ“ฅ json์œผ๋กœ ๋‹ค์šด๋กœ๋“œ", data=convert_json(df_result), file_name= "results.json", mime='application/json', key='json')
164
 
165
+
166
+
167
  with st.expander("(์ฃผ) ์ฟผ์นด์—์ด์•„์ด ๋ฐ๋ชจ ์‚ฌ์‚ฌ ๊ด€๋ จ", expanded=True):
168
 
169
  st.write(