Spaces:

awacke1
/

Search_Streamlit

Build error

App Files Files Community

awacke1 committed on Jun 24, 2022

Commit

6d3b539

•

1 Parent(s): c5ae802

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -35

app.py CHANGED Viewed

@@ -49,8 +49,10 @@ if query_params:
 selected_option = st.radio(
     "Param", options, index=ix, key="query", on_change=update_params
 )
-st.experimental_set_query_params(option=selected_option)
 try:
     st.session_state.query = query  # if set already above.  this prevents two interface elements setting it first time once
@@ -77,28 +79,6 @@ except: # catch exception and set query param to predefined value
     query_option = query_params['query'][0]
     query_option = "ai"
-# What impresses me about these two beautiful new streamlit persist prims is that one called the singleton can share memory across sessions (think all users yo)
-#@st.experimental_singleton
-#def get_sessionmaker(search_param):
-#	url = "https://en.wikipedia.org/wiki/"
-#	return url
-#search_param = "Star_Trek:_Discovery"
-#sm=  get_sessionmaker(search_param)
-# What is supercool about the second prim the memo is it makes unwieldy data very wieldy.  Like the Lord of Rings in reverse re "you cannot wield it!  none of us can." ->  "You can wield it, now everyone can."
-#@st.experimental_memo
-#def factorial(n):
-#	if n < 1:
-#		return 1
-#	return n * factorial(n - 1)
-#em10 = factorial(10)
-#em09 = factorial(9)  # Returns instantly!
 DEVICE = "cpu"
 MODEL_OPTIONS = ["msmarco-distilbert-base-tas-b", "all-mpnet-base-v2"]
 DESCRIPTION = """
@@ -144,14 +124,10 @@ def load():
     df = pd.read_csv("movies.csv")
     return tokenizers, models, embeddings, df
 tokenizers, models, embeddings, df = load()
 def pooling(model_output):
     """Return index 0 along the second axis of ``model_output.last_hidden_state``.

     Every entry along the first axis is kept; only position 0 of the second
     axis is selected.

     NOTE(review): presumably ``last_hidden_state`` is shaped
     (batch, sequence, hidden), which would make this the first-token
     embedding of each input -- confirm against the model in use.
     """
     return model_output.last_hidden_state[:, 0]
 def compute_embeddings(texts):
     encoded_input = tokenizers[0](
         texts, padding=True, truncation=True, return_tensors="pt"
@@ -161,10 +137,8 @@ def compute_embeddings(texts):
         model_output = models[0](**encoded_input, return_dict=True)
     embeddings = pooling(model_output)
     return embeddings.cpu().numpy()
 def pooling2(model_output, attention_mask):
     token_embeddings = model_output[0]
     input_mask_expanded = (
@@ -174,7 +148,6 @@ def pooling2(model_output, attention_mask):
         input_mask_expanded.sum(1), min=1e-9
     )
 def compute_embeddings2(list_of_strings):
     encoded_input = tokenizers[1](
         list_of_strings, padding=True, truncation=True, return_tensors="pt"
@@ -184,7 +157,6 @@ def compute_embeddings2(list_of_strings):
     sentence_embeddings = pooling2(model_output, encoded_input["attention_mask"])
     return F.normalize(sentence_embeddings, p=2, dim=1).cpu().numpy()
 @st.cache(
     show_spinner=False,
     hash_funcs={Tokenizer: lambda _: None, AddedToken: lambda _: None},
@@ -219,15 +191,11 @@ def semantic_search(query, model_id):
     delay = "%.3f" % (time.time() - start)
     return f"<p><i>Computation time: {delay} seconds</i></p>{result}</ol>"
 st.sidebar.markdown(DESCRIPTION)
 model_choice = st.sidebar.selectbox("Similarity model", options=MODEL_OPTIONS)
 model_id = 0 if model_choice == MODEL_OPTIONS[0] else 1
 clicked = click_detector(semantic_search(query, model_id))
 if clicked != "":

 selected_option = st.radio(
     "Param", options, index=ix, key="query", on_change=update_params
 )
+st.write("<style>div.row-widget.stRadio > div{flex-direction:row;}</style>", unsafe_allow_html=True)
+st.experimental_set_query_params(option=selected_option)
 try:
     st.session_state.query = query  # if set already above.  this prevents two interface elements setting it first time once
     query_option = query_params['query'][0]
     query_option = "ai"
 DEVICE = "cpu"
 MODEL_OPTIONS = ["msmarco-distilbert-base-tas-b", "all-mpnet-base-v2"]
 DESCRIPTION = """
     df = pd.read_csv("movies.csv")
     return tokenizers, models, embeddings, df
 tokenizers, models, embeddings, df = load()
 def pooling(model_output):
     """Return index 0 along the second axis of ``model_output.last_hidden_state``.

     Every entry along the first axis is kept; only position 0 of the second
     axis is selected.

     NOTE(review): presumably ``last_hidden_state`` is shaped
     (batch, sequence, hidden), which would make this the first-token
     embedding of each input -- confirm against the model in use.
     """
     return model_output.last_hidden_state[:, 0]
 def compute_embeddings(texts):
     encoded_input = tokenizers[0](
         texts, padding=True, truncation=True, return_tensors="pt"
         model_output = models[0](**encoded_input, return_dict=True)
     embeddings = pooling(model_output)
     return embeddings.cpu().numpy()
 def pooling2(model_output, attention_mask):
     token_embeddings = model_output[0]
     input_mask_expanded = (
         input_mask_expanded.sum(1), min=1e-9
     )
 def compute_embeddings2(list_of_strings):
     encoded_input = tokenizers[1](
         list_of_strings, padding=True, truncation=True, return_tensors="pt"
     sentence_embeddings = pooling2(model_output, encoded_input["attention_mask"])
     return F.normalize(sentence_embeddings, p=2, dim=1).cpu().numpy()
 @st.cache(
     show_spinner=False,
     hash_funcs={Tokenizer: lambda _: None, AddedToken: lambda _: None},
     delay = "%.3f" % (time.time() - start)
     return f"<p><i>Computation time: {delay} seconds</i></p>{result}</ol>"
 st.sidebar.markdown(DESCRIPTION)
 model_choice = st.sidebar.selectbox("Similarity model", options=MODEL_OPTIONS)
 model_id = 0 if model_choice == MODEL_OPTIONS[0] else 1
 clicked = click_detector(semantic_search(query, model_id))
 if clicked != "":