Upload folder using huggingface_hub

Browse files

Files changed (9) hide show

config.json +29 -0
config.yaml +208 -0
generation_config.json +7 -0
model.safetensors +3 -0
place-your-models-here.txt +0 -0
special_tokens_map.json +23 -0
tokenizer.json +0 -0
tokenizer.model +3 -0
tokenizer_config.json +42 -0

config.json ADDED Viewed

	@@ -0,0 +1,29 @@

+{
+  "_name_or_path": "/home/kearm/HF_FAST/TinyLlama_v1.1",
+  "architectures": [
+    "LlamaForCausalLM"
+  ],
+  "attention_bias": false,
+  "attention_dropout": 0.0,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 5632,
+  "max_position_embeddings": 2048,
+  "mlp_bias": false,
+  "model_type": "llama",
+  "num_attention_heads": 32,
+  "num_hidden_layers": 22,
+  "num_key_value_heads": 4,
+  "pretraining_tp": 1,
+  "rms_norm_eps": 1e-05,
+  "rope_scaling": null,
+  "rope_theta": 10000.0,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.43.1",
+  "use_cache": true,
+  "vocab_size": 32000
+}

config.yaml ADDED Viewed

	@@ -0,0 +1,208 @@

+.*(llama|alpac|vicuna|guanaco|koala|llava|wizardlm|metharme|pygmalion-7b|pygmalion-2|mythalion|wizard-mega|openbuddy|vigogne|h2ogpt-research|manticore):
+  model_type: 'llama'
+.*(opt-|opt_|opt1|opt3|optfor|galactica|galpaca|pygmalion-350m):
+  model_type: 'opt'
+.*(gpt-j|gptj|gpt4all-j|malion-6b|pygway|pygmalion-6b|dolly-v1):
+  model_type: 'gptj'
+.*(gpt-neox|koalpaca-polyglot|polyglot.*koalpaca|polyglot-ko|polyglot_ko|pythia|stablelm|incite|dolly-v2|polycoder|h2ogpt-oig|h2ogpt-oasst1|h2ogpt-gm):
+  model_type: 'gptneox'
+.*bloom:
+  model_type: 'bloom'
+.*gpt2:
+  model_type: 'gpt2'
+.*falcon:
+  model_type: 'falcon'
+.*mpt:
+  model_type: 'mpt'
+.*(starcoder|starchat):
+  model_type: 'starcoder'
+.*dolly-v2:
+  model_type: 'dollyv2'
+.*replit:
+  model_type: 'replit'
+.*(oasst|openassistant-|stablelm-7b-sft-v7-epoch-3):
+  instruction_template: 'Open Assistant'
+  skip_special_tokens: false
+(?!.*galactica)(?!.*reward).*openassistant:
+  instruction_template: 'Open Assistant'
+  skip_special_tokens: false
+.*galactica:
+  skip_special_tokens: false
+.*dolly-v[0-9]-[0-9]*b:
+  instruction_template: 'Alpaca'
+  skip_special_tokens: false
+.*alpaca-native-4bit:
+  instruction_template: 'Alpaca'
+  custom_stopping_strings: '"### End"'
+.*llava:
+  instruction_template: 'LLaVA'
+  custom_stopping_strings: '"\n###"'
+.*llava.*1.5:
+  instruction_template: 'Vicuna-v1.1'
+.*wizard.*mega:
+  instruction_template: 'Wizard-Mega'
+  custom_stopping_strings: '"</s>"'
+.*starchat-beta:
+  instruction_template: 'Starchat-Beta'
+  custom_stopping_strings: '"<|end|>"'
+(?!.*v0)(?!.*1.1)(?!.*1_1)(?!.*stable)(?!.*chinese).*vicuna:
+  instruction_template: 'Vicuna-v0'
+.*vicuna.*v0:
+  instruction_template: 'Vicuna-v0'
+.*vicuna.*(1.1|1_1|1.3|1_3):
+  instruction_template: 'Vicuna-v1.1'
+.*vicuna.*(1.5|1_5):
+  instruction_template: 'Vicuna-v1.1'
+.*stable.*vicuna:
+  instruction_template: 'StableVicuna'
+(?!.*chat).*chinese-vicuna:
+  instruction_template: 'Alpaca'
+.*chinese-vicuna.*chat:
+  instruction_template: 'Chinese-Vicuna-Chat'
+.*alpaca:
+  instruction_template: 'Alpaca'
+.*koala:
+  instruction_template: 'Koala'
+.*chatglm:
+  instruction_template: 'ChatGLM'
+.*(metharme|pygmalion|mythalion):
+  instruction_template: 'Metharme'
+.*raven:
+  instruction_template: 'RWKV-Raven'
+.*moss-moon.*sft:
+  instruction_template: 'MOSS'
+.*stablelm-tuned:
+  instruction_template: 'StableLM'
+.*galactica.*finetuned:
+  instruction_template: 'Galactica Finetuned'
+.*galactica.*-v2:
+  instruction_template: 'Galactica v2'
+(?!.*finetuned)(?!.*-v2).*galactica:
+  instruction_template: 'Galactica'
+.*guanaco:
+  instruction_template: 'Guanaco non-chat'
+.*baize:
+  instruction_template: 'Baize'
+.*mpt-.*instruct:
+  instruction_template: 'Alpaca'
+.*mpt-.*chat:
+  instruction_template: 'ChatML'
+(?!.*-flan-)(?!.*-t5-).*lamini-:
+  instruction_template: 'Alpaca'
+.*incite.*chat:
+  instruction_template: 'INCITE-Chat'
+.*incite.*instruct:
+  instruction_template: 'INCITE-Instruct'
+.*ziya-:
+  instruction_template: 'Ziya'
+.*koalpaca:
+  instruction_template: 'KoAlpaca'
+.*openbuddy:
+  instruction_template: 'OpenBuddy'
+(?!.*chat).*vigogne:
+  instruction_template: 'Vigogne-Instruct'
+.*vigogne.*chat:
+  instruction_template: 'Vigogne-Chat'
+.*(llama-deus|supercot|llama-natural-instructions|open-llama-0.3t-7b-instruct-dolly-hhrlhf|open-llama-0.3t-7b-open-instruct):
+  instruction_template: 'Alpaca'
+.*bactrian:
+  instruction_template: 'Bactrian'
+.*(h2ogpt-oig-|h2ogpt-oasst1-|h2ogpt-research-oasst1-):
+  instruction_template: 'INCITE-Chat'
+.*h2ogpt-gm-:
+  instruction_template: 'H2O-prompt_answer'
+.*manticore:
+  instruction_template: 'Manticore Chat'
+.*bluemoonrp-(30|13)b:
+  instruction_template: 'Bluemoon'
+.*Nous-Hermes-13b:
+  instruction_template: 'Alpaca'
+.*airoboros:
+  instruction_template: 'Vicuna-v1.1'
+.*airoboros.*1.2:
+  instruction_template: 'Airoboros-v1.2'
+.*alpa(cino|sta):
+  instruction_template: 'Alpaca'
+.*hippogriff:
+  instruction_template: 'Hippogriff'
+.*lazarus:
+  instruction_template: 'Alpaca'
+.*guanaco-.*(7|13|33|65)b:
+  instruction_template: 'Vicuna-v0'
+.*hypermantis:
+  instruction_template: 'Alpaca'
+.*open-llama-.*-open-instruct:
+  instruction_template: 'Alpaca'
+.*starcoder-gpteacher-code-instruct:
+  instruction_template: 'Alpaca'
+.*tulu:
+  instruction_template: 'Tulu'
+.*chronos:
+  instruction_template: 'Alpaca'
+.*samantha:
+  instruction_template: 'Samantha'
+.*wizardcoder:
+  instruction_template: 'Alpaca'
+.*minotaur:
+  instruction_template: 'Manticore Chat'
+.*orca_mini:
+  instruction_template: 'Orca Mini'
+.*(platypus|gplatty|superplatty):
+  instruction_template: 'Alpaca'
+.*(openorca-platypus2):
+  instruction_template: 'OpenOrca-Platypus2'
+  custom_stopping_strings: '"### Instruction:", "### Response:"'
+.*longchat:
+  instruction_template: 'Vicuna-v1.1'
+.*vicuna-33b:
+  instruction_template: 'Vicuna-v1.1'
+.*redmond-hermes-coder:
+  instruction_template: 'Alpaca'
+.*wizardcoder-15b:
+  instruction_template: 'Alpaca'
+.*wizardlm:
+  instruction_template: 'Vicuna-v1.1'
+.*godzilla:
+  instruction_template: 'Alpaca'
+.*llama(-?)(2|v2).*chat:
+  instruction_template: 'Llama-v2'
+.*newhope:
+  instruction_template: 'NewHope'
+.*stablebeluga2:
+  instruction_template: 'StableBeluga2'
+.*openchat:
+  instruction_template: 'OpenChat'
+.*codellama.*instruct:
+  instruction_template: 'Llama-v2'
+.*(mistral|mixtral).*instruct:
+  instruction_template: 'Mistral'
+.*mistral.*openorca:
+  instruction_template: 'ChatML'
+.*(WizardCoder-Python-34B-V1.0|Phind-CodeLlama-34B-v2|CodeBooga-34B-v0.1):
+  instruction_template: 'Alpaca'
+.*orca-2-(13|7)b:
+  instruction_template: 'ChatML'
+.*openhermes.*mistral:
+  instruction_template: 'ChatML'
+.*Yi-34B-Chat:
+  instruction_template: 'ChatML'
+(dolphin).*:
+  instruction_template: 'ChatML'
+.*synthia:
+  instruction_template: 'Synthia'
+.*(hercules|hyperion):
+  instruction_template: 'ChatML'
+.*command-r:
+  instruction_template: 'Command-R'
+.*xwin-lm-70b-v0.1:
+  instruction_template: 'Vicuna-v1.1'
+.*platypus-yi-34b:
+  instruction_template: 'Vicuna-v1.1'
+.*CausalLM-RP-34B:
+  instruction_template: 'ChatML'
+34b-beta:
+  instruction_template: 'ChatML'
+.*airoboros-3_1-yi-34b-200k:
+  instruction_template: 'Llama-v2'
+.*chatqa:
+  instruction_template: 'NVIDIA-ChatQA'

generation_config.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "max_length": 2048,
+  "pad_token_id": 0,
+  "transformers_version": "4.43.1"
+}

model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:925af99bc725da7c18479fc0f146153497cb8a2dcc78ab9907cab96c47ae150f
+size 2200119864

place-your-models-here.txt ADDED Viewed

File without changes

special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,23 @@

+{
+  "bos_token": {
+    "content": "<s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "eos_token": {
+    "content": "</s>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "unk_token": {
+    "content": "<unk>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  }
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
+size 499723

tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,42 @@

+{
+  "add_bos_token": true,
+  "add_eos_token": false,
+  "add_prefix_space": null,
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "legacy": false,
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": null,
+  "padding_side": "right",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "LlamaTokenizer",
+  "unk_token": "<unk>",
+  "use_default_system_prompt": false
+}