Spaces:

PetrovDE
/

HW_5_calc

Sleeping

App Files Files Community

PetrovDE committed on Nov 19, 2023

Commit

8b21bf3

•

1 Parent(s): 0637def

Add app and some data to model

Browse files

Files changed (8) hide show

app.py +166 -0
chkp/adapter_config.json +20 -0
chkp/adapter_model.bin +3 -0
chkp/optimizer.pt +3 -0
chkp/rng_state.pth +3 -0
chkp/scheduler.pt +3 -0
chkp/trainer_state.json +349 -0
chkp/training_args.bin +3 -0

app.py ADDED Viewed

	@@ -0,0 +1,166 @@

+import os
+import sys
+import fire
+import gradio as gr
+import torch
+import transformers
+from peft import PeftModel
+from transformers import GenerationConfig, LlamaForCausalLM, LlamaTokenizer
+from typing import Union
+import re
+class Prompter(object):
+    def generate_prompt(
+        self,
+        instruction: str,
+        label: Union[None, str] = None,
+    ) -> str:
+        res = f"{instruction}\nAnswer: "
+        if label:
+            res = f"{res}{label}"
+        return res
+    def get_response(self, output: str) -> str:
+        return (
+            output.split("Answer:")[1]
+            .strip()
+            .replace("/", "\u00F7")
+            .replace("*", "\u00D7")
+        )
+load_8bit = True  # for Colab
+base_model = "baffo32/decapoda-research-llama-7B-hf"
+lora_weights = "tiedong/goat-lora-7b"
+share_gradio = True
+if torch.cuda.is_available():
+    device = "cuda"
+else:
+    device = "cpu"
+try:
+    if torch.backends.mps.is_available():
+        device = "mps"
+except:
+    pass
+prompter = Prompter()
+tokenizer = LlamaTokenizer.from_pretrained("hf-internal-testing/llama-tokenizer")
+if device == "cuda":
+    model = LlamaForCausalLM.from_pretrained(
+        base_model,
+        load_in_8bit=load_8bit,
+        torch_dtype=torch.float16,
+        device_map="auto",
+    )
+    model = PeftModel.from_pretrained(
+        model,
+        lora_weights,
+        torch_dtype=torch.float16,
+        device_map={"": 0},
+    )
+elif device == "mps":
+    model = LlamaForCausalLM.from_pretrained(
+        base_model,
+        device_map={"": device},
+        torch_dtype=torch.float16,
+    )
+    model = PeftModel.from_pretrained(
+        model,
+        lora_weights,
+        device_map={"": device},
+        torch_dtype=torch.float16,
+    )
+else:
+    model = LlamaForCausalLM.from_pretrained(
+        base_model, device_map={"": device}, low_cpu_mem_usage=True
+    )
+    model = PeftModel.from_pretrained(
+        model,
+        lora_weights,
+        device_map={"": device},
+    )
+if not load_8bit:
+    model.half()
+model.eval()
+if torch.__version__ >= "2" and sys.platform != "win32":
+    model = torch.compile(model)
+def evaluate(
+    instruction,
+    temperature=0.1,
+    top_p=0.75,
+    top_k=40,
+    num_beams=4,
+    max_new_tokens=512,
+    stream_output=True,
+    **kwargs,
+):
+    prompt = prompter.generate_prompt(instruction)
+    inputs = tokenizer(prompt, return_tensors="pt")
+    input_ids = inputs["input_ids"].to(device)
+    generation_config = GenerationConfig(
+        temperature=temperature,
+        top_p=top_p,
+        top_k=top_k,
+        num_beams=num_beams,
+        **kwargs,
+    )
+    generate_params = {
+        "input_ids": input_ids,
+        "generation_config": generation_config,
+        "return_dict_in_generate": True,
+        "output_scores": True,
+        "max_new_tokens": max_new_tokens,
+    }
+    # Without streaming
+    with torch.no_grad():
+        generation_output = model.generate(
+            input_ids=input_ids,
+            generation_config=generation_config,
+            return_dict_in_generate=True,
+            output_scores=True,
+            max_new_tokens=max_new_tokens,
+        )
+    s = generation_output.sequences[0]
+    output = tokenizer.decode(s, skip_special_tokens=True).strip()
+    yield prompter.get_response(output)
+gr.Interface(
+    fn=evaluate,
+    inputs=[
+        gr.components.Textbox(
+            lines=1,
+            label="Arithmetic",
+            placeholder="What is 63303235 + 20239503",
+        ),
+        gr.components.Slider(minimum=0, maximum=1, value=0.1, label="Temperature"),
+        gr.components.Slider(minimum=0, maximum=1, value=0.75, label="Top p"),
+        gr.components.Slider(minimum=0, maximum=100, step=1, value=40, label="Top k"),
+        gr.components.Slider(minimum=1, maximum=4, step=1, value=4, label="Beams"),
+        gr.components.Slider(
+            minimum=1, maximum=1024, step=1, value=512, label="Max tokens"
+        ),
+    ],
+    outputs=[
+        gr.Textbox(
+            lines=5,
+            label="Output",
+        )
+    ],
+    title="test model",
+    description="Это пример реализации из goat",  # noqa: E501
+).queue().launch(share=share_gradio)

chkp/adapter_config.json ADDED Viewed

	@@ -0,0 +1,20 @@

+{
+  "base_model_name_or_path": "nickypro/tinyllama-15M",
+  "bias": "none",
+  "enable_lora": null,
+  "fan_in_fan_out": false,
+  "inference_mode": true,
+  "lora_alpha": 64,
+  "lora_dropout": 0.05,
+  "merge_weights": false,
+  "modules_to_save": null,
+  "peft_type": "LORA",
+  "r": 64,
+  "target_modules": [
+    "q_proj",
+    "v_proj",
+    "k_proj",
+    "o_proj"
+  ],
+  "task_type": "CAUSAL_LM"
+}

chkp/adapter_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49891d6a9e5d6098f4048189ae2bf4df53022b58c7689f25da4e6b9c481a018a
+size 3556350

chkp/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e68114a0c0afc9a77f9bd91ed114283dc2093c3bf42383e62897601f2b4f8129
+size 7118586

chkp/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cb69e610873a8142e0245cca374768d45ddb50a0c4891436e6dbf04d069a7122
+size 14244

chkp/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:90ba5da359c992d8f0dc912ca51bea8184b55a457a5f5fdfc7bc2702765e7d0d
+size 1064

chkp/trainer_state.json ADDED Viewed

	@@ -0,0 +1,349 @@

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 0.23157894736842105,
+  "eval_steps": 500,
+  "global_step": 550,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.0,
+      "learning_rate": 1e-05,
+      "loss": 4.8744,
+      "step": 10
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 2e-05,
+      "loss": 4.1114,
+      "step": 20
+    },
+    {
+      "epoch": 0.01,
+      "learning_rate": 3e-05,
+      "loss": 3.528,
+      "step": 30
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 4e-05,
+      "loss": 3.2573,
+      "step": 40
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 5e-05,
+      "loss": 3.1417,
+      "step": 50
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 6e-05,
+      "loss": 3.0506,
+      "step": 60
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 7e-05,
+      "loss": 2.9644,
+      "step": 70
+    },
+    {
+      "epoch": 0.03,
+      "learning_rate": 8e-05,
+      "loss": 2.8399,
+      "step": 80
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 9e-05,
+      "loss": 2.6935,
+      "step": 90
+    },
+    {
+      "epoch": 0.04,
+      "learning_rate": 0.0001,
+      "loss": 2.5259,
+      "step": 100
+    },
+    {
+      "epoch": 0.05,
+      "learning_rate": 9.956043956043956e-05,
+      "loss": 2.3713,
+      "step": 110
+    },
+    {
+      "epoch": 0.05,
+      "learning_rate": 9.912087912087913e-05,
+      "loss": 2.2237,
+      "step": 120
+    },
+    {
+      "epoch": 0.05,
+      "learning_rate": 9.868131868131869e-05,
+      "loss": 2.0999,
+      "step": 130
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 9.824175824175824e-05,
+      "loss": 2.0211,
+      "step": 140
+    },
+    {
+      "epoch": 0.06,
+      "learning_rate": 9.780219780219781e-05,
+      "loss": 1.949,
+      "step": 150
+    },
+    {
+      "epoch": 0.07,
+      "learning_rate": 9.736263736263737e-05,
+      "loss": 1.8819,
+      "step": 160
+    },
+    {
+      "epoch": 0.07,
+      "learning_rate": 9.692307692307692e-05,
+      "loss": 1.8244,
+      "step": 170
+    },
+    {
+      "epoch": 0.08,
+      "learning_rate": 9.64835164835165e-05,
+      "loss": 1.7849,
+      "step": 180
+    },
+    {
+      "epoch": 0.08,
+      "learning_rate": 9.604395604395605e-05,
+      "loss": 1.7288,
+      "step": 190
+    },
+    {
+      "epoch": 0.08,
+      "learning_rate": 9.560439560439561e-05,
+      "loss": 1.6914,
+      "step": 200
+    },
+    {
+      "epoch": 0.09,
+      "learning_rate": 9.516483516483517e-05,
+      "loss": 1.6534,
+      "step": 210
+    },
+    {
+      "epoch": 0.09,
+      "learning_rate": 9.472527472527473e-05,
+      "loss": 1.6332,
+      "step": 220
+    },
+    {
+      "epoch": 0.1,
+      "learning_rate": 9.428571428571429e-05,
+      "loss": 1.5944,
+      "step": 230
+    },
+    {
+      "epoch": 0.1,
+      "learning_rate": 9.384615384615386e-05,
+      "loss": 1.5789,
+      "step": 240
+    },
+    {
+      "epoch": 0.11,
+      "learning_rate": 9.340659340659341e-05,
+      "loss": 1.5583,
+      "step": 250
+    },
+    {
+      "epoch": 0.11,
+      "learning_rate": 9.296703296703297e-05,
+      "loss": 1.5485,
+      "step": 260
+    },
+    {
+      "epoch": 0.11,
+      "learning_rate": 9.252747252747253e-05,
+      "loss": 1.5124,
+      "step": 270
+    },
+    {
+      "epoch": 0.12,
+      "learning_rate": 9.208791208791209e-05,
+      "loss": 1.5004,
+      "step": 280
+    },
+    {
+      "epoch": 0.12,
+      "learning_rate": 9.164835164835165e-05,
+      "loss": 1.5042,
+      "step": 290
+    },
+    {
+      "epoch": 0.13,
+      "learning_rate": 9.12087912087912e-05,
+      "loss": 1.4991,
+      "step": 300
+    },
+    {
+      "epoch": 0.13,
+      "learning_rate": 9.076923076923078e-05,
+      "loss": 1.4692,
+      "step": 310
+    },
+    {
+      "epoch": 0.13,
+      "learning_rate": 9.032967032967033e-05,
+      "loss": 1.4628,
+      "step": 320
+    },
+    {
+      "epoch": 0.14,
+      "learning_rate": 8.989010989010989e-05,
+      "loss": 1.4481,
+      "step": 330
+    },
+    {
+      "epoch": 0.14,
+      "learning_rate": 8.945054945054946e-05,
+      "loss": 1.454,
+      "step": 340
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 8.901098901098901e-05,
+      "loss": 1.4409,
+      "step": 350
+    },
+    {
+      "epoch": 0.15,
+      "learning_rate": 8.857142857142857e-05,
+      "loss": 1.4339,
+      "step": 360
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 8.813186813186814e-05,
+      "loss": 1.4262,
+      "step": 370
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 8.76923076923077e-05,
+      "loss": 1.4298,
+      "step": 380
+    },
+    {
+      "epoch": 0.16,
+      "learning_rate": 8.725274725274725e-05,
+      "loss": 1.4247,
+      "step": 390
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 8.681318681318682e-05,
+      "loss": 1.4191,
+      "step": 400
+    },
+    {
+      "epoch": 0.17,
+      "learning_rate": 8.637362637362638e-05,
+      "loss": 1.4156,
+      "step": 410
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 8.593406593406593e-05,
+      "loss": 1.4102,
+      "step": 420
+    },
+    {
+      "epoch": 0.18,
+      "learning_rate": 8.54945054945055e-05,
+      "loss": 1.4121,
+      "step": 430
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 8.505494505494506e-05,
+      "loss": 1.4033,
+      "step": 440
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 8.461538461538461e-05,
+      "loss": 1.3986,
+      "step": 450
+    },
+    {
+      "epoch": 0.19,
+      "learning_rate": 8.417582417582419e-05,
+      "loss": 1.3935,
+      "step": 460
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 8.373626373626374e-05,
+      "loss": 1.399,
+      "step": 470
+    },
+    {
+      "epoch": 0.2,
+      "learning_rate": 8.32967032967033e-05,
+      "loss": 1.3888,
+      "step": 480
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 8.285714285714287e-05,
+      "loss": 1.3958,
+      "step": 490
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 8.241758241758242e-05,
+      "loss": 1.3758,
+      "step": 500
+    },
+    {
+      "epoch": 0.21,
+      "learning_rate": 8.197802197802198e-05,
+      "loss": 1.3779,
+      "step": 510
+    },
+    {
+      "epoch": 0.22,
+      "learning_rate": 8.153846153846155e-05,
+      "loss": 1.3754,
+      "step": 520
+    },
+    {
+      "epoch": 0.22,
+      "learning_rate": 8.10989010989011e-05,
+      "loss": 1.3754,
+      "step": 530
+    },
+    {
+      "epoch": 0.23,
+      "learning_rate": 8.065934065934066e-05,
+      "loss": 1.3854,
+      "step": 540
+    },
+    {
+      "epoch": 0.23,
+      "learning_rate": 8.021978021978022e-05,
+      "loss": 1.3579,
+      "step": 550
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 2375,
+  "num_train_epochs": 1,
+  "save_steps": 50,
+  "total_flos": 271592074027008.0,
+  "trial_name": null,
+  "trial_params": null
+}

chkp/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6f2106e8a7b7aaf8d6c8f70689f1a1f3239d79f9126f142a9ce1a3ba53c11449
+size 4536