yodiaditya committed on
Commit
cdcdbf3
1 Parent(s): c5a0cfc
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
  *.zip filter=lfs diff=lfs merge=lfs -text
  *.zst filter=lfs diff=lfs merge=lfs -text
  *tfevents* filter=lfs diff=lfs merge=lfs -text
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
README.md ADDED
@@ -0,0 +1,105 @@
+ ---
+ datasets:
+ - Local
+ license: bigscience-bloom-rail-1.0
+ language:
+ - id
+ pipeline_tag: text-generation
+ ---
+
+ # Table of Contents
+
+ 1. [Model Summary](#model-summary)
+ 2. [Use](#use)
+ 3. [Limitations](#limitations)
+ 4. [Training](#training)
+ 5. [Evaluation](#evaluation)
+ 6. [Citation](#citation)
+
+ # Model Summary
+
+ > We present KARINA, fine-tuned from [bigscience/bloomz-3b](https://huggingface.co/bigscience/bloomz-3b), a member of the BLOOMZ family of models capable of following human instructions in dozens of languages zero-shot. The BLOOMZ models were produced by fine-tuning pretrained multilingual BLOOM models on the crosslingual task mixture xP3, which makes them capable of crosslingual generalization to unseen tasks and languages.
+
+ # Use
+
+ ## Intended use
+
+ We recommend using the model to perform tasks expressed in natural language. For example, given the prompt "*Given the question:\n{{ siapa kamu? }}\n---\nAnswer:\n*" ("siapa kamu?" is Indonesian for "who are you?"), the model will most likely answer "*Saya Karina. Ada yang bisa saya bantu?*" ("I am Karina. Is there anything I can help with?").
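+
+ As a minimal sketch, that prompt can be assembled like this (the `question` variable is illustrative, not part of the released code):
+
+ ```python
+ # Wrap a raw user question in the template used during fine-tuning.
+ question = "siapa kamu?"  # Indonesian for "who are you?"
+ prompt = "Given the question:\n{{ " + question + " }}\n---\nAnswer:\n"
+ ```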
+
+ ## How to use
+
+ ### CPU
+
+ <details>
+ <summary> Click to expand </summary>
+
+ ```python
+ # pip install -q transformers
+ from transformers import AutoModelForCausalLM, AutoTokenizer
+
+ checkpoint = "yodi/karina"
+
+ tokenizer = AutoTokenizer.from_pretrained(checkpoint)
+ model = AutoModelForCausalLM.from_pretrained(checkpoint)
+
+ inputs = tokenizer.encode("Given the question:\n{{ siapa kamu? }}\n---\nAnswer:\n", return_tensors="pt")
+ outputs = model.generate(inputs)
+ print(tokenizer.decode(outputs[0]))
+ ```
+
+ </details>
+
+ ### GPU
+
+ <details>
+ <summary> Click to expand </summary>
+
+ ```python
+ # pip install -q transformers accelerate
+ from transformers import AutoModelForCausalLM, AutoTokenizer
+
+ checkpoint = "yodi/karina"
+
+ tokenizer = AutoTokenizer.from_pretrained(checkpoint)
+ model = AutoModelForCausalLM.from_pretrained(checkpoint, torch_dtype="auto", device_map="auto")
+
+ inputs = tokenizer.encode("Given the question:\n{{ siapa kamu? }}\n---\nAnswer:\n", return_tensors="pt").to("cuda")
+ outputs = model.generate(inputs)
+ print(tokenizer.decode(outputs[0]))
+ ```
+
+ </details>
+
+ ### GPU in 8bit
+
+ <details>
+ <summary> Click to expand </summary>
+
+ ```python
+ # pip install -q transformers accelerate bitsandbytes
+ from transformers import AutoModelForCausalLM, AutoTokenizer
+
+ checkpoint = "yodi/karina"
+
+ tokenizer = AutoTokenizer.from_pretrained(checkpoint)
+ model = AutoModelForCausalLM.from_pretrained(checkpoint, device_map="auto", load_in_8bit=True)
+
+ inputs = tokenizer.encode("Given the question:\n{{ siapa kamu? }}\n---\nAnswer:\n", return_tensors="pt").to("cuda")
+ outputs = model.generate(inputs)
+ print(tokenizer.decode(outputs[0]))
+ ```
+
+ </details>
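+
+ The snippets above call `generate` with default settings, which produce only a short continuation. A minimal sketch of passing explicit generation parameters (the values are illustrative, not tuned for this model):
+
+ ```python
+ # Allow a longer answer and use light sampling instead of greedy decoding.
+ outputs = model.generate(
+     inputs,
+     max_new_tokens=64,  # upper bound on newly generated tokens
+     do_sample=True,     # sample instead of greedy argmax
+     top_p=0.9,          # nucleus sampling cutoff
+     temperature=0.7,    # soften the next-token distribution
+ )
+ print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+ ```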
+
+ <!-- Necessary for whitespace -->
+ ###
+
+ # Limitations
+
+ **Prompt Engineering:** Performance may vary depending on the prompt; the model follows the prompting format of the BLOOMZ models it was fine-tuned from.
+
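+ A small sketch for probing prompt sensitivity, reusing `tokenizer` and `model` from the snippets above (the alternative template is illustrative):
+
+ ```python
+ # Compare outputs across prompt templates to gauge sensitivity.
+ for template in [
+     "Given the question:\n{{ %s }}\n---\nAnswer:\n",  # the fine-tuning template
+     "Pertanyaan: %s\nJawaban:",                       # a plain Indonesian Q/A format
+ ]:
+     inputs = tokenizer.encode(template % "siapa kamu?", return_tensors="pt")
+     outputs = model.generate(inputs, max_new_tokens=32)
+     print(tokenizer.decode(outputs[0], skip_special_tokens=True))
+ ```
+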
+ # Training
+
+ ## Model
+
+ - **Architecture:** Same as [bloom](https://huggingface.co/bigscience/bloom); see also the `config.json` file and the inspection sketch below
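+
+ A quick way to inspect those architecture details without downloading the weights (standard `transformers` API; the printed values reflect this commit's `config.json`):
+
+ ```python
+ from transformers import AutoConfig
+
+ # Loads only config.json, not the model weights.
+ config = AutoConfig.from_pretrained("yodi/karina")
+ print(config.architectures)  # ['BloomForCausalLM']
+ print(config.torch_dtype)    # torch.float16
+ ```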
config.json CHANGED
@@ -1,5 +1,5 @@
  {
- "_name_or_path": "outputs/model/",
+ "_name_or_path": "bigscience/bloomz-3b",
  "apply_residual_connection_post_layernorm": false,
  "architectures": [
  "BloomForCausalLM"
@@ -25,7 +25,7 @@
  "skip_bias_add": true,
  "skip_bias_add_qkv": false,
  "slow_but_exact": false,
- "torch_dtype": "bfloat16",
+ "torch_dtype": "float16",
  "transformers_version": "4.31.0",
  "unk_token_id": 0,
  "use_cache": true,
special_tokens_map.json ADDED
@@ -0,0 +1,6 @@
+ {
+ "bos_token": "<s>",
+ "eos_token": "</s>",
+ "pad_token": "<pad>",
+ "unk_token": "<unk>"
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:17a208233d2ee8d8c83b23bc214df737c44806a1919f444e89b31e586cd956ba
+ size 14500471
tokenizer_config.json ADDED
@@ -0,0 +1,10 @@
+ {
+ "add_prefix_space": false,
+ "bos_token": "<s>",
+ "clean_up_tokenization_spaces": false,
+ "eos_token": "</s>",
+ "model_max_length": 1000000000000000019884624838656,
+ "pad_token": "<pad>",
+ "tokenizer_class": "BloomTokenizer",
+ "unk_token": "<unk>"
+ }
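
A quick sanity check that the tokenizer files added in this commit load as expected (standard `transformers` API; with `tokenizer.json` present, `AutoTokenizer` returns the fast Bloom tokenizer):

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("yodi/karina")
print(tok.special_tokens_map)  # {'bos_token': '<s>', 'eos_token': '</s>', ...}
print(type(tok).__name__)      # BloomTokenizerFast
```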