Jonghyun Moon commited on
Commit
26f786b
โ€ข
1 Parent(s): 9842d55

deploy streamlit

Browse files
Files changed (4) hide show
  1. .gitignore +129 -0
  2. app.py +312 -0
  3. ballad_word.csv +0 -0
  4. requirements.txt +7 -0
.gitignore ADDED
@@ -0,0 +1,129 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Byte-compiled / optimized / DLL files
2
+ __pycache__/
3
+ *.py[cod]
4
+ *$py.class
5
+
6
+ # C extensions
7
+ *.so
8
+
9
+ # Distribution / packaging
10
+ .Python
11
+ build/
12
+ develop-eggs/
13
+ dist/
14
+ downloads/
15
+ eggs/
16
+ .eggs/
17
+ lib/
18
+ lib64/
19
+ parts/
20
+ sdist/
21
+ var/
22
+ wheels/
23
+ pip-wheel-metadata/
24
+ share/python-wheels/
25
+ *.egg-info/
26
+ .installed.cfg
27
+ *.egg
28
+ MANIFEST
29
+
30
+ # PyInstaller
31
+ # Usually these files are written by a python script from a template
32
+ # before PyInstaller builds the exe, so as to inject date/other infos into it.
33
+ *.manifest
34
+ *.spec
35
+
36
+ # Installer logs
37
+ pip-log.txt
38
+ pip-delete-this-directory.txt
39
+
40
+ # Unit test / coverage reports
41
+ htmlcov/
42
+ .tox/
43
+ .nox/
44
+ .coverage
45
+ .coverage.*
46
+ .cache
47
+ nosetests.xml
48
+ coverage.xml
49
+ *.cover
50
+ *.py,cover
51
+ .hypothesis/
52
+ .pytest_cache/
53
+
54
+ # Translations
55
+ *.mo
56
+ *.pot
57
+
58
+ # Django stuff:
59
+ *.log
60
+ local_settings.py
61
+ db.sqlite3
62
+ db.sqlite3-journal
63
+
64
+ # Flask stuff:
65
+ instance/
66
+ .webassets-cache
67
+
68
+ # Scrapy stuff:
69
+ .scrapy
70
+
71
+ # Sphinx documentation
72
+ docs/_build/
73
+
74
+ # PyBuilder
75
+ target/
76
+
77
+ # Jupyter Notebook
78
+ .ipynb_checkpoints
79
+
80
+ # IPython
81
+ profile_default/
82
+ ipython_config.py
83
+
84
+ # pyenv
85
+ .python-version
86
+
87
+ # pipenv
88
+ # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
89
+ # However, in case of collaboration, if having platform-specific dependencies or dependencies
90
+ # having no cross-platform support, pipenv may install dependencies that don't work, or not
91
+ # install all needed dependencies.
92
+ #Pipfile.lock
93
+
94
+ # PEP 582; used by e.g. github.com/David-OConnor/pyflow
95
+ __pypackages__/
96
+
97
+ # Celery stuff
98
+ celerybeat-schedule
99
+ celerybeat.pid
100
+
101
+ # SageMath parsed files
102
+ *.sage.py
103
+
104
+ # Environments
105
+ .env
106
+ .venv
107
+ env/
108
+ venv/
109
+ ENV/
110
+ env.bak/
111
+ venv.bak/
112
+
113
+ # Spyder project settings
114
+ .spyderproject
115
+ .spyproject
116
+
117
+ # Rope project settings
118
+ .ropeproject
119
+
120
+ # mkdocs documentation
121
+ /site
122
+
123
+ # mypy
124
+ .mypy_cache/
125
+ .dmypy.json
126
+ dmypy.json
127
+
128
+ # Pyre type checker
129
+ .pyre/
app.py ADDED
@@ -0,0 +1,312 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import pandas as pd
2
+ import requests
3
+ import streamlit as st
4
+ from streamlit_lottie import st_lottie
5
+ import torch
6
+ from transformers import AutoTokenizer, AutoModelForCausalLM
7
+ import re
8
+
9
+ # Page Config
10
+ st.set_page_config(
11
+ page_title="๋…ธ๋ž˜ ๊ฐ€์‚ฌ nํ–‰์‹œ Beta",
12
+ page_icon="๐Ÿ’Œ",
13
+ layout="wide"
14
+ )
15
+ # st.text(os.listdir(os.curdir))
16
+
17
+ ### Model
18
+ tokenizer = AutoTokenizer.from_pretrained("wumusill/final_project_kogpt2")
19
+
20
+ @st.cache(show_spinner=False)
21
+ def load_model():
22
+ model = AutoModelForCausalLM.from_pretrained("wumusill/final_project_kogpt2")
23
+ return model
24
+
25
+ model = load_model()
26
+
27
+ @st.cache(show_spinner=False)
28
+ def get_word():
29
+ word = pd.read_csv("ballad_word.csv", encoding="cp949")
30
+ return word
31
+
32
+
33
+ word = get_word()
34
+
35
+
36
+ one = word[word["0"].str.startswith("ํ•œ")].sample(1).values[0][0]
37
+ # st.header(type(one))
38
+ # st.header(one)
39
+
40
+
41
+ # Class : Dict ์ค‘๋ณต ํ‚ค ์ถœ๋ ฅ
42
+ class poem(object):
43
+ def __init__(self,letter):
44
+ self.letter = letter
45
+
46
+ def __str__(self):
47
+ return self.letter
48
+
49
+ def __repr__(self):
50
+ return "'"+self.letter+"'"
51
+
52
+
53
+ def beta_poem(input_letter):
54
+ # ๋‘์Œ ๋ฒ•์น™ ์‚ฌ์ „
55
+ dooeum = {"๋ผ":"๋‚˜", "๋ฝ":"๋‚™", "๋ž€":"๋‚œ", "๋ž„":"๋‚ ", "๋žŒ":"๋‚จ", "๋ž":"๋‚ฉ", "๋ž‘":"๋‚ญ",
56
+ "๋ž˜":"๋‚ด", "๋žญ":"๋ƒ‰", "๋ƒ‘":"์•ฝ", "๋žต":"์•ฝ", "๋ƒฅ":"์–‘", "๋Ÿ‰":"์–‘", "๋…€":"์—ฌ",
57
+ "๋ ค":"์—ฌ", "๋…":"์—ญ", "๋ ฅ":"์—ญ", "๋…„":"์—ฐ", "๋ จ":"์—ฐ", "๋…ˆ":"์—ด", "๋ ฌ":"์—ด",
58
+ "๋…":"์—ผ", "๋ ด":"์—ผ", "๋ ต":"์—ฝ", "๋…•":"์˜", "๋ น":"์˜", "๋…œ":"์˜ˆ", "๋ก€":"์˜ˆ",
59
+ "๋กœ":"๋…ธ", "๋ก":"๋…น", "๋ก ":"๋…ผ", "๋กฑ":"๋†", "๋ขฐ":"๋‡Œ", "๋‡จ":"์š”", "๋ฃŒ":"์š”",
60
+ "๋ฃก":"์šฉ", "๋ฃจ":"๋ˆ„", "๋‰ด":"์œ ", "๋ฅ˜":"์œ ", "๋‰ต":"์œก", "๋ฅ™":"์œก", "๋ฅœ":"์œค",
61
+ "๋ฅ ":"์œจ", "๋ฅญ":"์œต", "๋ฅต":"๋Š‘", "๋ฆ„":"๋Š ", "๋ฆ‰":"๋Šฅ", "๋‹ˆ":"์ด", "๋ฆฌ":"์ด",
62
+ "๋ฆฐ":'์ธ', '๋ฆผ':'์ž„', '๋ฆฝ':'์ž…'}
63
+ # ๊ฒฐ๊ณผ๋ฌผ์„ ๋‹ด์„ list
64
+ res_l = []
65
+ len_sequence = 0
66
+
67
+ # ํ•œ ๊ธ€์ž์”ฉ ์ธ๋ฑ์Šค์™€ ํ•จ๊ป˜ ๊ฐ€์ ธ์˜ด
68
+ for idx, val in enumerate(input_letter):
69
+ # ๋‘์Œ ๋ฒ•์น™ ์ ์šฉ
70
+ if val in dooeum.keys():
71
+ val = dooeum[val]
72
+
73
+ # ๋ฐœ๋ผ๋“œ์— ์žˆ๋Š” ๋‹จ์–ด ์ ์šฉ
74
+ try:
75
+ one = word[word["0"].str.startswith(val)].sample(1).values[0][0]
76
+ # st.text(one)
77
+ except:
78
+ one = val
79
+
80
+ # ์ข€๋” ๋งค๋„๋Ÿฌ์šด ์‚ผํ–‰์‹œ๋ฅผ ์œ„ํ•ด ์ด์ „ ๋ฌธ์žฅ์ด๋ž‘ ํ˜„์žฌ ์Œ์ ˆ ์—ฐ๊ฒฐ
81
+ # ์ดํ›„ generate ๋œ ๋ฌธ์žฅ์—์„œ ์ด์ „ ๋ฌธ์žฅ์— ๋Œ€ํ•œ ๋ฐ์ดํ„ฐ ์ œ๊ฑฐ
82
+ link_with_pre_sentence = (" ".join(res_l)+ " " + one + " " if idx != 0 else one).strip()
83
+ # print(link_with_pre_sentence)
84
+
85
+ # ์—ฐ๊ฒฐ๋œ ๋ฌธ์žฅ์„ ์ธ์ฝ”๋”ฉ
86
+ input_ids = tokenizer.encode(link_with_pre_sentence, add_special_tokens=False, return_tensors="pt")
87
+
88
+ # ์ธ์ฝ”๋”ฉ ๊ฐ’์œผ๋กœ ๋ฌธ์žฅ ์ƒ์„ฑ
89
+ output_sequence = model.generate(
90
+ input_ids=input_ids,
91
+ do_sample=True,
92
+ max_length=42,
93
+ min_length=len_sequence + 2,
94
+ temperature=0.9,
95
+ repetition_penalty=1.5,
96
+ no_repeat_ngram_size=2)
97
+
98
+ # ์ƒ์„ฑ๋œ ๋ฌธ์žฅ ๋ฆฌ์ŠคํŠธ๋กœ ๋ณ€ํ™˜ (์ธ์ฝ”๋”ฉ ๋˜์–ด์žˆ๊ณ , ์ƒ์„ฑ๋œ ๋ฌธ์žฅ ๋’ค๋กœ padding ์ด ์žˆ๋Š” ์ƒํƒœ)
99
+ generated_sequence = output_sequence.tolist()[0]
100
+
101
+ # padding index ์•ž๊นŒ์ง€ slicing ํ•จ์œผ๋กœ์จ padding ์ œ๊ฑฐ, padding์ด ์—†์„ ์ˆ˜๋„ ์žˆ๊ธฐ ๋•Œ๋ฌธ์— ์กฐ๊ฑด๋ฌธ ํ™•์ธ ํ›„ ์ œ๊ฑฐ
102
+ # ์‚ฌ์šฉํ•  generated_sequence ๊ฐ€ 5๋ณด๋‹ค ์งง์œผ๋ฉด ๊ฐ•์ œ์ ์œผ๋กœ ๊ธธ์ด๋ฅผ 8๋กœ ํ•ด์ค€๋‹ค...
103
+ if tokenizer.pad_token_id in generated_sequence:
104
+ check_index = generated_sequence.index(tokenizer.pad_token_id)
105
+ check_index = check_index if check_index-len_sequence > 3 else len_sequence + 8
106
+ generated_sequence = generated_sequence[:check_index]
107
+
108
+ word_encode = tokenizer.encode(one, add_special_tokens=False, return_tensors="pt").tolist()[0][0]
109
+ split_index = len(generated_sequence) - 1 - generated_sequence[::-1].index(word_encode)
110
+
111
+ # ์ฒซ ๊ธ€์ž๊ฐ€ ์•„๋‹ˆ๋ผ๋ฉด, generate ๋œ ์Œ์ ˆ๋งŒ ๊ฒฐ๊ณผ๋ฌผ list์— ๋“ค์–ด๊ฐˆ ์ˆ˜ ์žˆ๊ฒŒ ์•ž ๋ฌธ์žฅ์— ๋Œ€ํ•œ ์ธ์ฝ”๋”ฉ ๊ฐ’ ์ œ๊ฑฐ
112
+ generated_sequence = generated_sequence[split_index:]
113
+
114
+ # print(tokenizer.decode(generated_sequence, clean_up_tokenization_spaces=True, skip_special_tokens=True))
115
+ # ๋‹ค์Œ ์Œ์ ˆ์„ ์œ„ํ•ด ๊ธธ์ด ๊ฐฑ์‹ 
116
+ len_sequence += len([elem for elem in generated_sequence if elem not in(tokenizer.all_special_ids)])
117
+ # ๊ฒฐ๊ณผ๋ฌผ ๋””์ฝ”๋”ฉ
118
+ decoded_sequence = tokenizer.decode(generated_sequence, clean_up_tokenization_spaces=True, skip_special_tokens=True)
119
+
120
+ # ๊ฒฐ๊ณผ๋ฌผ ๋ฆฌ์ŠคํŠธ์— ๋‹ด๊ธฐ
121
+ res_l.append(decoded_sequence)
122
+
123
+ poem_dict = {"Type":"beta"}
124
+
125
+ for letter, res in zip(input_letter, res_l):
126
+ # decode_res = tokenizer.decode(res, clean_up_tokenization_spaces=True, skip_special_tokens=True)
127
+ poem_dict[poem(letter)] = res
128
+
129
+ return poem_dict
130
+
131
+ def alpha_poem(input_letter):
132
+
133
+ # ๋‘์Œ ๋ฒ•์น™ ์‚ฌ์ „
134
+ dooeum = {"๋ผ":"๋‚˜", "๋ฝ":"๋‚™", "๋ž€":"๋‚œ", "๋ž„":"๋‚ ", "๋žŒ":"๋‚จ", "๋ž":"๋‚ฉ", "๋ž‘":"๋‚ญ",
135
+ "๋ž˜":"๋‚ด", "๋žญ":"๋ƒ‰", "๋ƒ‘":"์•ฝ", "๋žต":"์•ฝ", "๋ƒฅ":"์–‘", "๋Ÿ‰":"์–‘", "๋…€":"์—ฌ",
136
+ "๋ ค":"์—ฌ", "๋…":"์—ญ", "๋ ฅ":"์—ญ", "๋…„":"์—ฐ", "๋ จ":"์—ฐ", "๋…ˆ":"์—ด", "๋ ฌ":"์—ด",
137
+ "๋…":"์—ผ", "๋ ด":"์—ผ", "๋ ต":"์—ฝ", "๋…•":"์˜", "๋ น":"์˜", "๋…œ":"์˜ˆ", "๋ก€":"์˜ˆ",
138
+ "๋กœ":"๋…ธ", "๋ก":"๋…น", "๋ก ":"๋…ผ", "๋กฑ":"๋†", "๋ขฐ":"๋‡Œ", "๋‡จ":"์š”", "๋ฃŒ":"์š”",
139
+ "๋ฃก":"์šฉ", "๋ฃจ":"๋ˆ„", "๋‰ด":"์œ ", "๋ฅ˜":"์œ ", "๋‰ต":"์œก", "๋ฅ™":"์œก", "๋ฅœ":"์œค",
140
+ "๋ฅ ":"์œจ", "๋ฅญ":"์œต", "๋ฅต":"๋Š‘", "๋ฆ„":"๋Š ", "๋ฆ‰":"๋Šฅ", "๋‹ˆ":"์ด", "๋ฆฌ":"์ด",
141
+ "๋ฆฐ":'์ธ', '๋ฆผ':'์ž„', '๋ฆฝ':'์ž…'}
142
+ # ๊ฒฐ๊ณผ๋ฌผ์„ ๋‹ด์„ list
143
+ res_l = []
144
+
145
+ # ํ•œ ๊ธ€์ž์”ฉ ์ธ๋ฑ์Šค์™€ ํ•จ๊ป˜ ๊ฐ€์ ธ์˜ด
146
+ for idx, val in enumerate(input_letter):
147
+ # ๋‘์Œ ๋ฒ•์น™ ์ ์šฉ
148
+ if val in dooeum.keys():
149
+ val = dooeum[val]
150
+
151
+
152
+ while True:
153
+ # ๋งŒ์•ฝ idx ๊ฐ€ 0 ์ด๋ผ๋ฉด == ์ฒซ ๊ธ€์ž
154
+ if idx == 0:
155
+ # ์ฒซ ๊ธ€์ž ์ธ์ฝ”๋”ฉ
156
+ input_ids = tokenizer.encode(
157
+ val, add_special_tokens=False, return_tensors="pt")
158
+ # print(f"{idx}๋ฒˆ ์ธ์ฝ”๋”ฉ : {input_ids}\n") # 2์ฐจ์› ํ…์„œ
159
+
160
+ # ์ฒซ ๊ธ€์ž ์ธ์ฝ”๋”ฉ ๊ฐ’์œผ๋กœ ๋ฌธ์žฅ ์ƒ์„ฑ
161
+ output_sequence = model.generate(
162
+ input_ids=input_ids,
163
+ do_sample=True,
164
+ max_length=42,
165
+ min_length=5,
166
+ temperature=0.9,
167
+ repetition_penalty=1.7,
168
+ no_repeat_ngram_size=2)[0]
169
+ # print("์ฒซ ๊ธ€์ž ์ธ์ฝ”๋”ฉ ํ›„ generate ๊ฒฐ๊ณผ:", output_sequence, "\n") # tensor
170
+
171
+ # ์ฒซ ๊ธ€์ž๊ฐ€ ์•„๋‹ˆ๋ผ๋ฉด
172
+ else:
173
+ # ํ•œ ์Œ์ ˆ
174
+ input_ids = tokenizer.encode(
175
+ val, add_special_tokens=False, return_tensors="pt")
176
+ # print(f"{idx}๋ฒˆ ์งธ ๊ธ€์ž ์ธ์ฝ”๋”ฉ : {input_ids} \n")
177
+
178
+ # ์ข€๋” ๋งค๋„๋Ÿฌ์šด ์‚ผํ–‰์‹œ๋ฅผ ์œ„ํ•ด ์ด์ „ ์ธ์ฝ”๋”ฉ๊ณผ ์ง€๊ธˆ ์ธ์ฝ”๋”ฉ ์—ฐ๊ฒฐ
179
+ link_with_pre_sentence = torch.cat((generated_sequence, input_ids[0]), 0)
180
+ link_with_pre_sentence = torch.reshape(link_with_pre_sentence, (1, len(link_with_pre_sentence)))
181
+ # print(f"์ด์ „ ํ…์„œ์™€ ์—ฐ๊ฒฐ๋œ ํ…์„œ {link_with_pre_sentence} \n")
182
+
183
+ # ์ธ์ฝ”๋”ฉ ๊ฐ’์œผ๋กœ ๋ฌธ์žฅ ์ƒ์„ฑ
184
+ output_sequence = model.generate(
185
+ input_ids=link_with_pre_sentence,
186
+ do_sample=True,
187
+ max_length=42,
188
+ min_length=5,
189
+ temperature=0.9,
190
+ repetition_penalty=1.7,
191
+ no_repeat_ngram_size=2)[0]
192
+ # print(f"{idx}๋ฒˆ ์ธ์ฝ”๋”ฉ ํ›„ generate : {output_sequence}")
193
+
194
+ # ์ƒ์„ฑ๋œ ๋ฌธ์žฅ ๋ฆฌ์ŠคํŠธ๋กœ ๋ณ€ํ™˜ (์ธ์ฝ”๋”ฉ ๋˜์–ด์žˆ๊ณ , ์ƒ์„ฑ๋œ ๋ฌธ์žฅ ๋’ค๋กœ padding ์ด ์žˆ๋Š” ์ƒํƒœ)
195
+ generated_sequence = output_sequence.tolist()
196
+ # print(f"{idx}๋ฒˆ ์ธ์ฝ”๋”ฉ ๋ฆฌ์ŠคํŠธ : {generated_sequence} \n")
197
+
198
+ # padding index ์•ž๊นŒ์ง€ slicing ํ•จ์œผ๋กœ์จ padding ์ œ๊ฑฐ, padding์ด ์—†์„ ์ˆ˜๋„ ์žˆ๊ธฐ ๋•Œ๋ฌธ์— ์กฐ๊ฑด๋ฌธ ํ™•์ธ ํ›„ ์ œ๊ฑฐ
199
+ if tokenizer.pad_token_id in generated_sequence:
200
+ generated_sequence = generated_sequence[:generated_sequence.index(tokenizer.pad_token_id)]
201
+
202
+ generated_sequence = torch.tensor(generated_sequence)
203
+ # print(f"{idx}๋ฒˆ ์ธ์ฝ”๋”ฉ ๋ฆฌ์ŠคํŠธ ํŒจ๋”ฉ ์ œ๊ฑฐ ํ›„ ๋‹ค์‹œ ํ…์„œ : {generated_sequence} \n")
204
+
205
+ # ์ฒซ ๊ธ€์ž๊ฐ€ ์•„๋‹ˆ๋ผ๋ฉด, generate ๋œ ์Œ์ ˆ๋งŒ ๊ฒฐ๊ณผ๋ฌผ list์— ๋“ค์–ด๊ฐˆ ์ˆ˜ ์žˆ๊ฒŒ ์•ž ๋ฌธ์žฅ์— ๋Œ€ํ•œ ์ธ์ฝ”๋”ฉ ๊ฐ’ ์ œ๊ฑฐ
206
+ # print(generated_sequence)
207
+ if idx != 0:
208
+ # ์ด์ „ ๋ฌธ์žฅ์˜ ๊ธธ์ด ์ดํ›„๋กœ ์Šฌ๋ผ์ด์‹ฑํ•ด์„œ ์•ž ๋ฌธ์žฅ ์ œ๊ฑฐ
209
+ generated_sequence = generated_sequence[len_sequence:]
210
+
211
+ len_sequence = len(generated_sequence)
212
+ # print("len_seq", len_sequence)
213
+
214
+ # ์Œ์ ˆ ๊ทธ๋Œ€๋กœ ๋ฑ‰์œผ๋ฉด ๋‹ค์‹œ ํ•ด์™€, ์•„๋‹ˆ๋ฉด while๋ฌธ ํƒˆ์ถœ
215
+ if len_sequence > 1:
216
+ break
217
+
218
+ # ๊ฒฐ๊ณผ๋ฌผ ๋ฆฌ์ŠคํŠธ์— ๋‹ด๊ธฐ
219
+ res_l.append(generated_sequence)
220
+
221
+ poem_dict = {"Type":"alpha"}
222
+
223
+ for letter, res in zip(input_letter, res_l):
224
+ decode_res = tokenizer.decode(res, clean_up_tokenization_spaces=True, skip_special_tokens=True)
225
+ poem_dict[poem(letter)] = decode_res
226
+
227
+ return poem_dict
228
+
229
+ # Image(.gif)
230
+ @st.cache(show_spinner=False)
231
+ def load_lottieurl(url: str):
232
+ r = requests.get(url)
233
+ if r.status_code != 200:
234
+ return None
235
+ return r.json()
236
+
237
+ lottie_url = "https://assets7.lottiefiles.com/private_files/lf30_fjln45y5.json"
238
+
239
+ lottie_json = load_lottieurl(lottie_url)
240
+ st_lottie(lottie_json, speed=1, height=200, key="initial")
241
+
242
+
243
+ # Title
244
+ row0_spacer1, row0_1, row0_spacer2, row0_2, row0_spacer3 = st.columns(
245
+ (0.01, 2, 0.05, 0.5, 0.01)
246
+ )
247
+
248
+ with row0_1:
249
+ st.markdown("# ํ•œ๊ธ€ ๋…ธ๋ž˜ ๊ฐ€์‚ฌ nํ–‰์‹œโœ")
250
+ st.markdown("### ๐Ÿฆ๋ฉ‹์Ÿ์ด์‚ฌ์ž์ฒ˜๋Ÿผ AIS7๐Ÿฆ - ํŒŒ์ด๋„ ํ”„๋กœ์ ํŠธ")
251
+
252
+ with row0_2:
253
+ st.write("")
254
+ st.write("")
255
+ st.write("")
256
+ st.subheader("1์กฐ - ํ•ดํŒŒ๋ฆฌ")
257
+ st.write("์ด์ง€ํ˜œ, ์ตœ์ง€์˜, ๊ถŒ์†Œํฌ, ๋ฌธ์ข…ํ˜„, ๊ตฌ์žํ˜„, ๊น€์˜์ค€")
258
+
259
+ st.write('---')
260
+
261
+ # Explanation
262
+ row1_spacer1, row1_1, row1_spacer2 = st.columns((0.01, 0.01, 0.01))
263
+
264
+ with row1_1:
265
+ st.markdown("### nํ–‰์‹œ ๊ฐ€์ด๋“œ๋ผ์ธ")
266
+ st.markdown("1. ํ•˜๋‹จ์— ์žˆ๋Š” ํ…์ŠคํŠธ๋ฐ”์— 5์ž ์ดํ•˜ ๋‹จ์–ด๋ฅผ ๋„ฃ์–ด์ฃผ์„ธ์š”")
267
+ st.markdown("2. 'nํ–‰์‹œ ์ œ์ž‘ํ•˜๊ธฐ' ๋ฒ„ํŠผ์„ ํด๋ฆญํ•ด์ฃผ์„ธ์š”")
268
+ st.markdown("* nํ–‰์‹œ ํƒ€์ž… ์„ค์ •\n"
269
+ " * Alpha ver. : ๋ชจ๋ธ์ด ์ฒซ ์Œ์ ˆ๋ถ€ํ„ฐ ์ƒ์„ฑ\n"
270
+ " * Beta ver. : ์ฒซ ์Œ์ ˆ์„ ๋ฐ์ดํ„ฐ์…‹์—์„œ ์ฐพ๊ณ , ๋‹ค์Œ ๋ถ€๋ถ„์„ ์ƒ์„ฑ")
271
+
272
+ st.write('---')
273
+
274
+ # Model & Input
275
+ row2_spacer1, row2_1, row2_spacer2= st.columns((0.01, 0.01, 0.01))
276
+
277
+ col1, col2 = st.columns(2)
278
+
279
+ # Word Input
280
+ with row2_1:
281
+
282
+ with col1:
283
+ genre = st.radio(
284
+ "nํ–‰์‹œ ํƒ€์ž… ์„ ํƒ",
285
+ ('Alpha', 'Beta(test์ค‘)'))
286
+
287
+ if genre == 'Alpha':
288
+ n_line_poem = alpha_poem
289
+
290
+ else:
291
+ n_line_poem = beta_poem
292
+
293
+ with col2:
294
+ word_input = st.text_input(
295
+ "nํ–‰์‹œ์— ์‚ฌ์šฉํ•  ๋‹จ์–ด๋ฅผ ์ ๊ณ  ๋ฒ„ํŠผ์„ ๋ˆŒ๋Ÿฌ์ฃผ์„ธ์š”.(์ตœ๋Œ€ 5์ž) ๐Ÿ‘‡",
296
+ placeholder='ํ•œ๊ธ€ ๋‹จ์–ด๋ฅผ ์ž…๋ ฅํ•ด์ฃผ์„ธ์š”',
297
+ max_chars=5
298
+ )
299
+ word_input = re.sub("[^๊ฐ€-ํžฃ]", "", word_input)
300
+
301
+ if st.button('nํ–‰์‹œ ์ œ์ž‘ํ•˜๊ธฐ'):
302
+ if word_input == "":
303
+ st.error("์˜จ์ „ํ•œ ํ•œ๊ธ€ ๋‹จ์–ด๋ฅผ ์‚ฌ์šฉํ•ด์ฃผ์„ธ์š”!")
304
+
305
+ else:
306
+ st.write("nํ–‰์‹œ ๋‹จ์–ด : ", word_input)
307
+ with st.spinner('์ž ์‹œ ๊ธฐ๋‹ค๋ ค์ฃผ์„ธ์š”...'):
308
+ result = n_line_poem(word_input)
309
+ st.success('์™„๋ฃŒ๋์Šต๋‹ˆ๋‹ค!')
310
+ for r in result:
311
+ st.write(f'{r} : {result[r]}')
312
+
ballad_word.csv ADDED
The diff for this file is too large to render. See raw diff
 
requirements.txt ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ pandas
2
+ # numpy
3
+ streamlit
4
+ requests
5
+ streamlit_lottie
6
+ torch
7
+ transformers