anonymousauthors committed on
Commit
8a8c82c
β€’
1 Parent(s): b53f7e8

Update pages/2_😈_BlackBox_and_WhiteBox_Attacks.py

pages/2_😈_BlackBox_and_WhiteBox_Attacks.py CHANGED
@@ -25,12 +25,12 @@ st.sidebar.markdown('`Input text`: a sentence or paragraph.')
 st.sidebar.markdown('`Number of replacements`: the number of secret language samples.')
 st.sidebar.markdown('`Steps for searching Secret Langauge`: the steps in the SecretFinding process.')
 st.sidebar.markdown('#### Two methods')
-st.sidebar.markdown('1. Searching secret languages based on models: this method calculates secret languages using [gpt2-medium](https://huggingface.co/gpt2-medium), [EleutherAI/gpt-neo-1.3B](https://huggingface.co/EleutherAI/gpt-neo-1.3B)') #, [EleutherAI/gpt-neo-2.7B](https://huggingface.co/EleutherAI/gpt-neo-2.7B), [EleutherAI/gpt-neox-20b](https://huggingface.co/EleutherAI/gpt-neox-20b), or [EleutherAI/gpt-j-6B](https://huggingface.co/EleutherAI/gpt-j-6B).')
+st.sidebar.markdown('1. Searching secret languages based on models: this method calculates secret languages using [gpt2](https://huggingface.co/gpt2), [gpt2-medium](https://huggingface.co/gpt2-medium), [EleutherAI/gpt-neo-1.3B](https://huggingface.co/EleutherAI/gpt-neo-1.3B)') #, [EleutherAI/gpt-neo-2.7B](https://huggingface.co/EleutherAI/gpt-neo-2.7B), [EleutherAI/gpt-neox-20b](https://huggingface.co/EleutherAI/gpt-neox-20b), or [EleutherAI/gpt-j-6B](https://huggingface.co/EleutherAI/gpt-j-6B).')
 st.sidebar.markdown('2. Use the secret language we found on ALBERT, DistillBERT, and Roberta: this method replaces words directly with the secret language dictionary derived from ALBERT, DistillBERT, and Roberta.')

 st.sidebar.markdown('#### Return')
 st.sidebar.markdown(
-    'To see whether the whitebox attack works on LLMs (gpt2-medium and EleutherAI/gpt-neo-1.3B), we set random seeds to 0 and present the responses.'
+    'To see whether the whitebox attack works on LLMs (gpt2 and EleutherAI/gpt-neo-1.3B), we set random seeds to 0 and present the responses.'
 )
 st.sidebar.markdown(
     'To see whether the blackbox attack works on LLMs, we also add the response using [Codex](https://openai.com/blog/openai-codex/). '
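The sidebar text above states that responses are produced with the random seed fixed to 0. A minimal standalone sketch of what that seeding looks like with the transformers pipeline API; this is not code from the commit, and the prompt string is a placeholder rather than the app's actual input:

```python
# Hedged sketch: reproduce the "seed = 0" behaviour described in the sidebar.
# The prompt below is a placeholder; the app reads its input from st.text_area.
from transformers import pipeline, set_seed

set_seed(0)  # fix all RNGs so the displayed responses are reproducible

generator = pipeline('text-generation', model='gpt2')  # this commit switches from gpt2-medium to gpt2
prompt = 'Example input text.'
print(generator(prompt, max_length=64, num_return_sequences=1)[0]['generated_text'])
```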
@@ -264,8 +264,8 @@ title = st.text_area('Input text.', 'Which name is also used to describe the Ama
 if option == 'Searching secret languages based on models':
     model_choice = st.selectbox(
         'Which model you would like to use?',
-        # ('gpt2-medium', "EleutherAI/gpt-neo-1.3B", "EleutherAI/gpt-neo-2.7B", "EleutherAI/gpt-neox-20b", "EleutherAI/gpt-j-6B")
-        ('gpt2-medium', "EleutherAI/gpt-neo-1.3B")
+        # ('gpt2', "EleutherAI/gpt-neo-1.3B", "EleutherAI/gpt-neo-2.7B", "EleutherAI/gpt-neox-20b", "EleutherAI/gpt-j-6B")
+        ('gpt2', 'gpt2-medium', "EleutherAI/gpt-neo-1.3B")
     )
     _cols = st.columns(2)
     restarts = _cols[0].number_input('Number of replacements.', value=10, min_value=1, step=1, format='%d')
@@ -277,7 +277,7 @@ if button('Tokenize', key='tokenizer'):
     if option == 'Searching secret languages based on models':
         tokenizer = AutoTokenizer.from_pretrained(model_choice)
     else:
-        tokenizer = AutoTokenizer.from_pretrained('gpt2-medium')
+        tokenizer = AutoTokenizer.from_pretrained('gpt2')
     for key in st.session_state.keys():
         if key not in ['tokenizer', 'start'] and 'tokenizer_' not in key:
             del st.session_state[key]
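A short sketch of the tokenizer selection this hunk changes, assuming the same AutoTokenizer API; the option and model_choice values are hard-coded stand-ins for Streamlit state, not the app's control flow. The fallback moves from 'gpt2-medium' to 'gpt2', which use the same GPT-2 BPE vocabulary, so tokenization of the input text is unaffected:

```python
# Illustrative only: mirrors the branch above with hard-coded stand-ins for the
# Streamlit state (option / model_choice).
from transformers import AutoTokenizer

option = 'Searching secret languages based on models'   # stand-in for the st.selectbox value
model_choice = 'EleutherAI/gpt-neo-1.3B'                 # stand-in for the chosen model

if option == 'Searching secret languages based on models':
    tokenizer = AutoTokenizer.from_pretrained(model_choice)
else:
    tokenizer = AutoTokenizer.from_pretrained('gpt2')    # new fallback; formerly 'gpt2-medium'

print(tokenizer.tokenize('Example input text.'))
```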
@@ -318,7 +318,7 @@ if button('Tokenize', key='tokenizer'):
     if not platform.system().lower() == 'darwin':
         generator1 = pipeline('text-generation', model='EleutherAI/gpt-neo-1.3B')
     with st.expander('**Original input text**: '+ title):
-        st.markdown(f'The response of gpt2-medium with the prompt :blue[{title}]')
+        st.markdown(f'The response of gpt2 with the prompt :blue[{title}]')
         st.markdown('<blockquote>' + generator(title, max_length=256, num_return_sequences=1)[0]['generated_text'].replace(title, '', 1) + '</blockquote>', unsafe_allow_html=True)
         if not platform.system().lower() == 'darwin':
             st.markdown(f'The response of EleutherAI/gpt-neo-1.3B with the prompt :blue[{title}]')
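The response rendering in this hunk strips the echoed prompt out of generated_text before quoting it. A hedged sketch of that pattern outside Streamlit; the generator and title here are assumptions standing in for the app's objects:

```python
# Sketch of the generate-then-strip-prompt pattern used in the expander above.
from transformers import pipeline

generator = pipeline('text-generation', model='gpt2')  # stands in for the app's generator

title = 'Example input text.'  # placeholder for the app's text_area value
generated = generator(title, max_length=256, num_return_sequences=1)[0]['generated_text']
response = generated.replace(title, '', 1)  # drop the first occurrence of the prompt, as the app does
print(response)
```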
@@ -363,7 +363,7 @@ if button('Tokenize', key='tokenizer'):
     # st.markdown('<br>'.join(outputs), unsafe_allow_html=True)
     for i in range(restarts):
         with st.expander(outputs[i]):
-            st.markdown(f'The response of gpt2-medium with the prompt :blue[{outputs[i]}]')
+            st.markdown(f'The response of gpt2 with the prompt :blue[{outputs[i]}]')
             st.markdown('<blockquote>' + generator(outputs[i], max_length=256, num_return_sequences=1)[0]['generated_text'].replace(title, '', 1) + '</blockquote>', unsafe_allow_html=True)
             if not platform.system().lower() == 'darwin':
                 st.markdown(f'The response of EleutherAI/gpt-neo-1.3B with the prompt :blue[{outputs[i]}]')
 