Add Beta Version ./dataset/dataset_prompt_summary-gpt_Sample.json
Browse files- .gitattributes +7 -32
- README.md +22 -0
- config.json +77 -0
- dataset/dataset_CLIP.json +0 -0
- dataset/dataset_prompt_summary-gpt_Sample.json +0 -0
- dataset/dataset_test.json +16 -0
- generation_config.json +16 -0
- merges.txt +0 -0
- model.safetensors +3 -0
- tokenizer_config.json +1 -0
- vocab.json +0 -0
.gitattributes
CHANGED
@@ -1,35 +1,10 @@
|
|
1 |
-
*.
|
2 |
-
*.
|
3 |
*.bin filter=lfs diff=lfs merge=lfs -text
|
4 |
-
*.bz2 filter=lfs diff=lfs merge=lfs -text
|
5 |
-
*.ckpt filter=lfs diff=lfs merge=lfs -text
|
6 |
-
*.ftz filter=lfs diff=lfs merge=lfs -text
|
7 |
-
*.gz filter=lfs diff=lfs merge=lfs -text
|
8 |
*.h5 filter=lfs diff=lfs merge=lfs -text
|
9 |
-
*.joblib filter=lfs diff=lfs merge=lfs -text
|
10 |
-
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
11 |
-
*.mlmodel filter=lfs diff=lfs merge=lfs -text
|
12 |
-
*.model filter=lfs diff=lfs merge=lfs -text
|
13 |
-
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
14 |
-
*.npy filter=lfs diff=lfs merge=lfs -text
|
15 |
-
*.npz filter=lfs diff=lfs merge=lfs -text
|
16 |
-
*.onnx filter=lfs diff=lfs merge=lfs -text
|
17 |
-
*.ot filter=lfs diff=lfs merge=lfs -text
|
18 |
-
*.parquet filter=lfs diff=lfs merge=lfs -text
|
19 |
-
*.pb filter=lfs diff=lfs merge=lfs -text
|
20 |
-
*.pickle filter=lfs diff=lfs merge=lfs -text
|
21 |
-
*.pkl filter=lfs diff=lfs merge=lfs -text
|
22 |
-
*.pt filter=lfs diff=lfs merge=lfs -text
|
23 |
-
*.pth filter=lfs diff=lfs merge=lfs -text
|
24 |
-
*.rar filter=lfs diff=lfs merge=lfs -text
|
25 |
-
*.safetensors filter=lfs diff=lfs merge=lfs -text
|
26 |
-
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
27 |
-
*.tar.* filter=lfs diff=lfs merge=lfs -text
|
28 |
-
*.tar filter=lfs diff=lfs merge=lfs -text
|
29 |
*.tflite filter=lfs diff=lfs merge=lfs -text
|
30 |
-
*.
|
31 |
-
*.
|
32 |
-
*.
|
33 |
-
*.
|
34 |
-
|
35 |
-
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
1 |
+
*.bin.* filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.lfs.* filter=lfs diff=lfs merge=lfs -text
|
3 |
*.bin filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
4 |
*.h5 filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5 |
*.tflite filter=lfs diff=lfs merge=lfs -text
|
6 |
+
*.tar.gz filter=lfs diff=lfs merge=lfs -text
|
7 |
+
*.ot filter=lfs diff=lfs merge=lfs -text
|
8 |
+
*.onnx filter=lfs diff=lfs merge=lfs -text
|
9 |
+
*.msgpack filter=lfs diff=lfs merge=lfs -text
|
10 |
+
model.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
README.md
ADDED
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
language: en
|
3 |
+
tags:
|
4 |
+
- summarization
|
5 |
+
license: apache-2.0
|
6 |
+
metrics:
|
7 |
+
- rouge
|
8 |
+
model-index:
|
9 |
+
- name: distilbart-cnn-12-6-finetuned-weaksup-1000
|
10 |
+
results: []
|
11 |
+
datasets:
|
12 |
+
- sengunsipahi/civitai_top10k
|
13 |
+
thumbnail: https://huggingface.co/front/thumbnails/distilbart_medium.png
|
14 |
+
---
|
15 |
+
|
16 |
+
### Usage
|
17 |
+
|
18 |
+
This checkpoint should be loaded into `BartForConditionalGeneration.from_pretrained`. See the [BART docs](https://huggingface.co/transformers/model_doc/bart.html?#transformers.BartForConditionalGeneration) for more information.
|
19 |
+
|
20 |
+
# distilbart-cnn-12-6-SD-prompt
|
21 |
+
|
22 |
+
This model is a [fine-tuned](https://pastebin.com/DTZ0WRz6) version of [sshleifer/distilbart-cnn-12-6](https://huggingface.co/sshleifer/distilbart-cnn-12-6), trained on a [dataset](https://huggingface.co/Nekochu/distilbart-cnn-12-6-SD-prompt/blob/main/dataset/dataset_CLIP.json) that was [modified](https://pastebin.com/6CVe3PMS) by LLMs to be semi-synthetic, for summarizing Stable Diffusion prompts.
|
config.json
ADDED
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "sshleifer/distilbart-cnn-12-6",
|
3 |
+
"_num_labels": 3,
|
4 |
+
"activation_dropout": 0.0,
|
5 |
+
"activation_function": "gelu",
|
6 |
+
"add_bias_logits": false,
|
7 |
+
"add_final_layer_norm": false,
|
8 |
+
"architectures": [
|
9 |
+
"BartForConditionalGeneration"
|
10 |
+
],
|
11 |
+
"attention_dropout": 0.0,
|
12 |
+
"bos_token_id": 0,
|
13 |
+
"classif_dropout": 0.0,
|
14 |
+
"classifier_dropout": 0.0,
|
15 |
+
"d_model": 1024,
|
16 |
+
"decoder_attention_heads": 16,
|
17 |
+
"decoder_ffn_dim": 4096,
|
18 |
+
"decoder_layerdrop": 0.0,
|
19 |
+
"decoder_layers": 6,
|
20 |
+
"decoder_start_token_id": 2,
|
21 |
+
"dropout": 0.1,
|
22 |
+
"early_stopping": true,
|
23 |
+
"encoder_attention_heads": 16,
|
24 |
+
"encoder_ffn_dim": 4096,
|
25 |
+
"encoder_layerdrop": 0.0,
|
26 |
+
"encoder_layers": 12,
|
27 |
+
"eos_token_id": 2,
|
28 |
+
"extra_pos_embeddings": 2,
|
29 |
+
"force_bos_token_to_be_generated": true,
|
30 |
+
"forced_bos_token_id": 0,
|
31 |
+
"forced_eos_token_id": 2,
|
32 |
+
"gradient_checkpointing": false,
|
33 |
+
"id2label": {
|
34 |
+
"0": "LABEL_0",
|
35 |
+
"1": "LABEL_1",
|
36 |
+
"2": "LABEL_2"
|
37 |
+
},
|
38 |
+
"init_std": 0.02,
|
39 |
+
"is_encoder_decoder": true,
|
40 |
+
"label2id": {
|
41 |
+
"LABEL_0": 0,
|
42 |
+
"LABEL_1": 1,
|
43 |
+
"LABEL_2": 2
|
44 |
+
},
|
45 |
+
"length_penalty": 2.0,
|
46 |
+
"max_length": 142,
|
47 |
+
"max_position_embeddings": 1024,
|
48 |
+
"min_length": 56,
|
49 |
+
"model_type": "bart",
|
50 |
+
"no_repeat_ngram_size": 3,
|
51 |
+
"normalize_before": false,
|
52 |
+
"normalize_embedding": true,
|
53 |
+
"num_beams": 4,
|
54 |
+
"num_hidden_layers": 12,
|
55 |
+
"output_past": true,
|
56 |
+
"pad_token_id": 1,
|
57 |
+
"prefix": " ",
|
58 |
+
"replacing_rate": 0,
|
59 |
+
"scale_embedding": false,
|
60 |
+
"static_position_embeddings": false,
|
61 |
+
"student_decoder_layers": null,
|
62 |
+
"student_encoder_layers": null,
|
63 |
+
"task_specific_params": {
|
64 |
+
"summarization": {
|
65 |
+
"early_stopping": true,
|
66 |
+
"length_penalty": 2.0,
|
67 |
+
"max_length": 142,
|
68 |
+
"min_length": 56,
|
69 |
+
"no_repeat_ngram_size": 3,
|
70 |
+
"num_beams": 4
|
71 |
+
}
|
72 |
+
},
|
73 |
+
"torch_dtype": "float32",
|
74 |
+
"transformers_version": "4.38.1",
|
75 |
+
"use_cache": true,
|
76 |
+
"vocab_size": 50264
|
77 |
+
}
|
dataset/dataset_CLIP.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
dataset/dataset_prompt_summary-gpt_Sample.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
dataset/dataset_test.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"input_ids": [
|
3 |
+
"The Eiffel Tower is a wrought-iron lattice tower on the Champ de Mars in Paris, France. It is named after the engineer Gustave Eiffel, whose company designed and built the tower.",
|
4 |
+
"Python is an interpreted, high-level, general-purpose programming language. Created by Guido van Rossum and first released in 1991, Python's design philosophy emphasizes code readability with its notable use of significant whitespace.",
|
5 |
+
"The Mona Lisa is a half-length portrait painting by Italian artist Leonardo da Vinci. Considered an archetypal masterpiece of the Italian Renaissance, it has been described as 'the best known, the most visited, the most written about, the most sung about, the most parodied work of art in the world.'",
|
6 |
+
"The Great Wall of China is a series of fortifications that were built across the historical northern borders of ancient Chinese states and Imperial China as protection against various nomadic groups from the Eurasian Steppe.",
|
7 |
+
"Albert Einstein was a German-born theoretical physicist, widely acknowledged to be one of the greatest physicists of all time. Einstein is known for developing the theory of relativity, but he also made important contributions to the development of the theory of quantum mechanics."
|
8 |
+
],
|
9 |
+
"labels": [
|
10 |
+
"The Eiffel Tower, located on the Champ de Mars in Paris, was designed and built by Gustave Eiffel's company.",
|
11 |
+
"Python, created by Guido van Rossum in 1991, is a high-level programming language that emphasizes code readability.",
|
12 |
+
"The Mona Lisa, a masterpiece of the Italian Renaissance, is the world's most famous and iconic piece of art, painted by Leonardo da Vinci.",
|
13 |
+
"The Great Wall of China, built along the northern borders of ancient Chinese states, served as protection against nomadic groups.",
|
14 |
+
"Albert Einstein, a German-born theoretical physicist, is renowned for his development of the theory of relativity and contributions to quantum mechanics."
|
15 |
+
]
|
16 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 0,
|
4 |
+
"decoder_start_token_id": 2,
|
5 |
+
"early_stopping": true,
|
6 |
+
"eos_token_id": 2,
|
7 |
+
"forced_bos_token_id": 0,
|
8 |
+
"forced_eos_token_id": 2,
|
9 |
+
"length_penalty": 2.0,
|
10 |
+
"max_length": 142,
|
11 |
+
"min_length": 56,
|
12 |
+
"no_repeat_ngram_size": 3,
|
13 |
+
"num_beams": 4,
|
14 |
+
"pad_token_id": 1,
|
15 |
+
"transformers_version": "4.38.1"
|
16 |
+
}
|
merges.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f24010df7a95669145bef23363ff1aad73abcb13171f39b8b61c16532a1f837
|
3 |
+
size 1222284056
|
tokenizer_config.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"model_max_length": 1024}
|
vocab.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|