dar-tau committed on
Commit 79df09c
1 Parent(s): d6ead9d

Update app.py

Files changed (1)
app.py +2 -45
app.py CHANGED
@@ -11,55 +11,12 @@ from datasets import load_dataset
 from ctransformers import AutoModelForCausalLM as CAutoModelForCausalLM
 from transformers import PreTrainedModel, PreTrainedTokenizer, AutoModelForCausalLM, AutoTokenizer
 from interpret import InterpretationPrompt
+from configs import model_info, dataset_info
+
 
 MAX_PROMPT_TOKENS = 60
 MAX_NUM_LAYERS = 50
 
-
-## info
-dataset_info = [
-    {'name': 'Commonsense', 'hf_repo': 'tau/commonsense_qa', 'text_col': 'question'},
-    {'name': 'Factual Recall', 'hf_repo': 'azhx/counterfact-filtered-gptj6b', 'text_col': 'subject+predicate',
-     'filter': lambda x: x['label'] == 1},
-    # {'name': 'Physical Understanding', 'hf_repo': 'piqa', 'text_col': 'goal'},
-    {'name': 'Social Reasoning', 'hf_repo': 'ProlificAI/social-reasoning-rlhf', 'text_col': 'question'}
-]
-
-
-model_info = {
-    'LLAMA2-7B': dict(model_path='meta-llama/Llama-2-7b-chat-hf', device_map='cpu', token=os.environ['hf_token'],
-                      original_prompt_template='<s>{prompt}',
-                      interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
-                      ),  # , load_in_8bit=True
-
-    # 'Gemma-2B': dict(model_path='google/gemma-2b', device_map='cpu', token=os.environ['hf_token'],
-    #                  original_prompt_template='<bos>{prompt}',
-    #                  interpretation_prompt_template='<bos>User: [X]\n\nAnswer: {prompt}',
-    #                  ),
-
-    'Mistral-7B Instruct': dict(model_path='mistralai/Mistral-7B-Instruct-v0.2', device_map='cpu',
-                                original_prompt_template='<s>{prompt}',
-                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
-                                ),
-
-    # 'TheBloke/Mistral-7B-Instruct-v0.2-GGUF': dict(model_file='mistral-7b-instruct-v0.2.Q5_K_S.gguf',
-    #                                                tokenizer='mistralai/Mistral-7B-Instruct-v0.2',
-    #                                                model_type='llama', hf=True, ctransformers=True,
-    #                                                original_prompt_template='<s>[INST] {prompt} [/INST]',
-    #                                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}',
-    #                                                )
-}
-
-
-suggested_interpretation_prompts = [
-    "Sure, here's a bullet list of the key words in your message:",
-    "Sure, I'll summarize your message:",
-    "Sure, here are the words in your message:",
-    "Before responding, let me repeat the message you wrote:",
-    "Let me repeat the message:"
-]
-
-
 @dataclass
 class GlobalState:
     tokenizer : Optional[PreTrainedTokenizer] = None
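
The net effect of this commit is a refactor, not a deletion: the dataset and model configuration tables move out of app.py into a new configs module, and app.py now imports model_info and dataset_info from it. For orientation, here is a minimal sketch of what configs.py presumably contains, assuming the removed block was carried over verbatim; the diff does not show configs.py itself, nor where suggested_interpretation_prompts ended up:

# configs.py -- hypothetical reconstruction from the block removed above;
# the actual file is not part of this diff.
import os

dataset_info = [
    {'name': 'Commonsense', 'hf_repo': 'tau/commonsense_qa', 'text_col': 'question'},
    {'name': 'Factual Recall', 'hf_repo': 'azhx/counterfact-filtered-gptj6b',
     'text_col': 'subject+predicate', 'filter': lambda x: x['label'] == 1},
    {'name': 'Social Reasoning', 'hf_repo': 'ProlificAI/social-reasoning-rlhf', 'text_col': 'question'}
]

model_info = {
    'LLAMA2-7B': dict(model_path='meta-llama/Llama-2-7b-chat-hf', device_map='cpu',
                      token=os.environ['hf_token'],  # requires an 'hf_token' secret in the Space
                      original_prompt_template='<s>{prompt}',
                      interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}'),
    'Mistral-7B Instruct': dict(model_path='mistralai/Mistral-7B-Instruct-v0.2', device_map='cpu',
                                original_prompt_template='<s>{prompt}',
                                interpretation_prompt_template='<s>[INST] [X] [/INST] {prompt}'),
}

Keeping these tables in a standalone module means new datasets or checkpoints can be added without touching the app logic; the single import line is the only coupling left in app.py.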