Proprogrammer committed on Dec 7, 2025

Commit

ae9d625

verified ·

1 Parent(s): 0d7db3e

Proprogrammer/max-1

Files changed (19) hide show

.gitattributes CHANGED Viewed

@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text

 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+combined_corpus.jsonl filter=lfs diff=lfs merge=lfs -text

README.md ADDED Viewed

+---
+library_name: transformers
+tags:
+- generated_from_trainer
+model-index:
+- name: full_llm_output
+  results: []
+---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# full_llm_output
+This model is a fine-tuned version of an unspecified base model on an unspecified dataset.
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
+## Training and evaluation data
+More information needed
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 0.0002
+- train_batch_size: 1
+- eval_batch_size: 8
+- seed: 42
+- gradient_accumulation_steps: 16
+- total_train_batch_size: 16
+- optimizer: AdamW (OptimizerNames.ADAMW_TORCH) with betas=(0.9, 0.999), epsilon=1e-08, and no additional optimizer arguments
+- lr_scheduler_type: linear
+- training_steps: 100
+- mixed_precision_training: Native AMP
+### Training results
+### Framework versions
+- Transformers 4.56.0
+- Pytorch 2.8.0+cu129
+- Datasets 4.4.1
+- Tokenizers 0.22.0

combined_corpus.jsonl ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:8e48264212456d2a40baf531d17e5b63d8285166d23c08547e008425d8d6fbb1
+size 264316958

config.json ADDED Viewed

+{
+  "activation_function": "gelu_new",
+  "architectures": [
+    "GPT2LMHeadModel"
+  ],
+  "attn_pdrop": 0.1,
+  "bos_token_id": 1,
+  "dtype": "float32",
+  "embd_pdrop": 0.1,
+  "eos_token_id": 2,
+  "initializer_range": 0.02,
+  "layer_norm_epsilon": 1e-05,
+  "model_type": "gpt2",
+  "n_ctx": 2048,
+  "n_embd": 832,
+  "n_head": 13,
+  "n_inner": null,
+  "n_layer": 12,
+  "n_positions": 2048,
+  "pad_token_id": 0,
+  "reorder_and_upcast_attn": false,
+  "resid_pdrop": 0.1,
+  "scale_attn_by_inverse_layer_idx": false,
+  "scale_attn_weights": true,
+  "summary_activation": null,
+  "summary_first_dropout": 0.1,
+  "summary_proj_to_labels": true,
+  "summary_type": "cls_index",
+  "summary_use_proj": true,
+  "transformers_version": "4.56.0",
+  "use_cache": true,
+  "vocab_size": 52000
+}

generation_config.json ADDED Viewed

+{
+  "_from_model_config": true,
+  "bos_token_id": 1,
+  "eos_token_id": 2,
+  "pad_token_id": 0,
+  "transformers_version": "4.56.0"
+}

hf_corpus/cache-09216fe8055d0e98.arrow ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:ad896171869f385baf40d239736f85d6ee9d4c816add4090e3dc7c47eb78a79a
+size 333626080

hf_corpus/cache-7ae6ee44d0d52703.arrow ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:02750fa8e7f172798e5be525dc95ca89a74b98c66327023bae253e7c4310ccd7
+size 651467768

hf_corpus/cache-865cd6218c9ced23.arrow ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:3413a096e9968390a3333ff960b651c89d8a94dd0a3ff2ff58f87beedd95d9fe
+size 221376

hf_corpus/data-00000-of-00001.arrow ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e6dc576a7947eb458c99ab962f9932f4714c076dca948a5ef3e5dee14dbe526
+size 259346416

hf_corpus/dataset_info.json ADDED Viewed

+{
+  "citation": "",
+  "description": "",
+  "features": {
+    "text": {
+      "dtype": "string",
+      "_type": "Value"
+    }
+  },
+  "homepage": "",
+  "license": ""
+}

hf_corpus/state.json ADDED Viewed

+{
+  "_data_files": [
+    {
+      "filename": "data-00000-of-00001.arrow"
+    }
+  ],
+  "_fingerprint": "66c916b8a72e4890",
+  "_format_columns": null,
+  "_format_kwargs": {},
+  "_format_type": null,
+  "_output_all_columns": false,
+  "_split": null
+}

hf_tokenizer_dir/special_tokens_map.json ADDED Viewed

+{
+  "bos_token": "<bos>",
+  "eos_token": "<eos>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

hf_tokenizer_dir/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

hf_tokenizer_dir/tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<bos>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<eos>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<bos>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<eos>",
+  "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "unk_token": "<unk>"
+}

model.safetensors ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:e8f3dfa813c4beb31513db895a523bbceca599572ea6df8c5bf07646292e3c30
+size 579133600

special_tokens_map.json ADDED Viewed

+{
+  "bos_token": "<bos>",
+  "eos_token": "<eos>",
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

tokenizer_config.json ADDED Viewed

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<bos>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "<eos>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "bos_token": "<bos>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<eos>",
+  "extra_special_tokens": {},
+  "model_max_length": 1000000000000000019884624838656,
+  "pad_token": "<pad>",
+  "tokenizer_class": "PreTrainedTokenizerFast",
+  "unk_token": "<unk>"
+}

training_args.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ce42b5fd0555a143cb08096a8161909e9228a718279840fa5d12f2b433e8d46
+size 5713