AlbertoFH98 committed on
Commit
24bbdf7
1 Parent(s): 66216e0

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +26 -21
app.py CHANGED
@@ -15,11 +15,10 @@ import spacy
15
  import time
16
  import os
17
  import re
 
18
 
19
  @st.cache
20
  def get_args():
21
- st.set_page_config(layout="wide")
22
-
23
  # -- 1. Setup arguments
24
  parser = argparse.ArgumentParser()
25
  parser.add_argument('--DEFAULT_SYSTEM_PROMPT_LINK', type=str, default="https://raw.githubusercontent.com/AlbertoUAH/Castena/main/prompts/default_system_prompt.txt", help='Valor para DEFAULT_SYSTEM_PROMPT_LINK')
@@ -43,25 +42,12 @@ def get_podcast_data(transcription_path):
43
  together.Models.start(MODEL)
44
  podcast_url_video_df = pd.read_csv(PODCAST_URL_VIDEO_PATH, sep=';')
45
  return podcast_url_video_df
46
-
47
- def main():
48
- args = get_args()
49
- B_INST, E_INST = "[INST]", "[/INST]"
50
- B_SYS, E_SYS = "<<SYS>>\n", "\n<</SYS>>\n\n"
51
-
52
- # -- 4. Get parameters
53
- PODCAST_URL_VIDEO_PATH = args.PODCAST_URL_VIDEO_PATH
54
- DEFAULT_SYSTEM_PROMPT_LINK = args.DEFAULT_SYSTEM_PROMPT_LINK
55
- TRANSCRIPTION = args.TRANSCRIPTION
56
- TRANSCRIPTION_PATH = '{}_transcription.txt'.format(TRANSCRIPTION)
57
- MODEL = args.MODEL
58
- EMB_MODEL = args.EMB_MODEL
59
-
60
- podcast_url_video_df = get_podcast_data(TRANSCRIPTION_PATH)
61
 
62
- r = requests.get("https://raw.githubusercontent.com/AlbertoUAH/Castena/main/media/castena-animated-icon.gif", stream=True)
 
 
63
  icon = Image.open(r.raw)
64
- icon = icon.resize((100, 100))
65
  st.sidebar.image(icon)
66
  video_option = st.sidebar.selectbox(
67
  "Seleccione el podcast",
@@ -72,11 +58,30 @@ def main():
72
  youtube_video_url = list(podcast_url_video_df[podcast_url_video_df['podcast_name'].str.contains(video_option_joined)]['youtube_video_url'])[0].replace("\'", "")
73
 
74
  # -- 4. Setup request for system prompt
75
- f = urllib.request.urlopen(DEFAULT_SYSTEM_PROMPT_LINK)
76
  DEFAULT_SYSTEM_PROMPT = str(f.read(), 'UTF-8')
77
 
78
  # -- 5. Setup app
79
- translator, nlp, retriever = utils.setup_app(video_option_joined_path, EMB_MODEL, MODEL, logger)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
80
 
81
 
82
  # -- 6. Setup prompt template + llm chain
 
15
  import time
16
  import os
17
  import re
18
+ st.set_page_config(layout="wide")
19
 
20
  @st.cache
21
  def get_args():
 
 
22
  # -- 1. Setup arguments
23
  parser = argparse.ArgumentParser()
24
  parser.add_argument('--DEFAULT_SYSTEM_PROMPT_LINK', type=str, default="https://raw.githubusercontent.com/AlbertoUAH/Castena/main/prompts/default_system_prompt.txt", help='Valor para DEFAULT_SYSTEM_PROMPT_LINK')
 
42
  together.Models.start(MODEL)
43
  podcast_url_video_df = pd.read_csv(PODCAST_URL_VIDEO_PATH, sep=';')
44
  return podcast_url_video_df
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
45
 
46
+ @st.cache
47
+ def setup_basics_comp(emb_model, model, default_system_prompt_link, logger, podcast_url_video_df, img_size=100):
48
+ r = requests.get("https://raw.githubusercontent.com/AlbertoUAH/Castena/main/media/castena-animated-icon.gif", stream=True)
49
  icon = Image.open(r.raw)
50
+ icon = icon.resize((img_size, img_size))
51
  st.sidebar.image(icon)
52
  video_option = st.sidebar.selectbox(
53
  "Seleccione el podcast",
 
58
  youtube_video_url = list(podcast_url_video_df[podcast_url_video_df['podcast_name'].str.contains(video_option_joined)]['youtube_video_url'])[0].replace("\'", "")
59
 
60
  # -- 4. Setup request for system prompt
61
+ f = urllib.request.urlopen(default_system_prompt_link)
62
  DEFAULT_SYSTEM_PROMPT = str(f.read(), 'UTF-8')
63
 
64
  # -- 5. Setup app
65
+ translator, nlp, retriever = utils.setup_app(video_option_joined_path, emb_model, model, logger)
66
+ return translator, nlp, retriever, video_option, video_option_joined_path
67
+
68
+ def main():
69
+ args = get_args()
70
+ B_INST, E_INST = "[INST]", "[/INST]"
71
+ B_SYS, E_SYS = "<<SYS>>\n", "\n<</SYS>>\n\n"
72
+
73
+ PODCAST_URL_VIDEO_PATH = args.PODCAST_URL_VIDEO_PATH
74
+ DEFAULT_SYSTEM_PROMPT_LINK = args.DEFAULT_SYSTEM_PROMPT_LINK
75
+ TRANSCRIPTION = args.TRANSCRIPTION
76
+ TRANSCRIPTION_PATH = '{}_transcription.txt'.format(TRANSCRIPTION)
77
+ MODEL = args.MODEL
78
+ EMB_MODEL = args.EMB_MODEL
79
+
80
+ podcast_url_video_df = get_podcast_data(TRANSCRIPTION_PATH)
81
+
82
+ translator, nlp, retriever, video_option, video_option_joined_path = setup_basics_comp(EMB_MODEL, MODEL,
83
+ DEFAULT_SYSTEM_PROMPT_LINK, logger,
84
+ podcast_url_video_df, img_size=100)
85
 
86
 
87
  # -- 6. Setup prompt template + llm chain