Edit model card
YAML Metadata Warning: empty or missing yaml metadata in repo card (https://huggingface.co/docs/hub/model-cards#model-card-metadata)

import torch
from transformers import T5TokenizerFast, T5ForConditionalGeneration

# Check whether a GPU is available; fall back to the CPU otherwise.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Load the tokenizer and the model from the "jokh7802/KoT5_Summarization"
# checkpoint, then move the model to the selected device.
model_name = "jokh7802/KoT5_Summarization"
tokenizer = T5TokenizerFast.from_pretrained(model_name)
model = T5ForConditionalGeneration.from_pretrained(model_name).to(device)

# Test passage: a Korean text about AI technology used as the summarization
# input. The literal is built from adjacent string segments that Python
# concatenates as written.
# NOTE(review): some segments join without a separating space (e.g. after
# "발전해야 합니다."); this is kept exactly as in the original -- confirm
# whether a space was intended.
sample_text_3 = (
    "인공지능 기술은 현대 사회에서 매우 중요한 역할을 하고 있습니다. 기계 학습과 딥 러닝의 발전으로 언어 처리, 이미지 인식, 음성 인식, 자율 주행 "
    "차량 및 의료 진단과 같은 다양한 분야에서 급격한 진보가 이루어지고 있습니다. 이러한 기술은 우리의 삶을 크게 변화시키고 있으며, 다양한 산업 분야에 "
    "새로운 기회를 제공하고 있습니다. 그러나 이러한 기술 발전에는 고려해야 할 여러 중요한 측면이 있습니다. 인공지능 기술은 데이터에 의존하며, 데이터의 품질과 "
    "개인 정보 보호는 계속해서 주목해야 할 문제입니다. 또한, 알고리즘의 투명성과 공정성에 대한 우려도 높아지고 있습니다. 인간 중심의 개발과 윤리적인 책임을 중시하는 "
    "방향으로 기술이 발전해야 합니다."
    "머신 러닝 및 딥 러닝은 대량의 데이터를 기반으로 학습하고, 이를 통해 패턴을 식별하고 예측합니다. 이러한 모델은 이미지, 음성, 텍스트와 같은 다양한 형태의 데이터를 처리할 수 있으며, "
    "이를 통해 언어 번역, 음성 인식, 얼굴 인식, 추천 시스템 및 예측 분석과 같은 응용 프로그램을 구현할 수 있습니다. 하지만 이러한 모델은 데이터의 편향성에 영향을 받을 수 있으며, "
    "이로 인해 공정하지 않은 결과를 낼 수 있습니다. 이를 극복하기 위해서는 다양한 데이터를 사용하고, 알고리즘을 평가하고 개선하는 데 지속적인 노력이 필요합니다."
    "또한, 인공지능의 미래에는 실용적인 문제를 해결하는 데 중점을 두고 있습니다. 예를 들어 의료 분야에서는 질병 진단 및 치료에 도움을 주는 기술이 개발되고 있습니다. 농업 분야에서는 "
    "작물 생산성을 향상시키기 위한 지능형 농업 기술이 적용되고 있습니다. 또한, 스마트 시티 기술은 도시의 효율성과 지속 가능성을 향상시키는 데 기여하고 있습니다. 이러한 혁신적인 적용 분야에서는 "
    "기술과 윤리가 조화를 이루며 사회적 가치를 창출하는 방향으로 나아가야 합니다."
)

# The text that is actually fed to the tokenizer.
input_text = sample_text_3

# Tokenize the input text (truncated to at most 512 tokens) and generate a
# summary of up to 150 tokens using beam search with 4 beams.
input_ids = tokenizer.encode(
    input_text,
    return_tensors="pt",
    max_length=512,
    truncation=True,
).to(device)
output = model.generate(
    input_ids,
    max_length=150,
    num_beams=4,
    length_penalty=2.0,
    early_stopping=True,
)

# Decode the first generated sequence (special tokens removed) and print it
# together with the original input text.
summary = tokenizer.decode(output[0], skip_special_tokens=True)
print("Original Sentence: ", input_text)
print("Generated Summary: ", summary)

# Output
# Original Sentence: 이 모델은 한국어 문장을 효과적으로 요약하는 데 사용될 수 있습니다.
# Generated Summary: 한국어 문장을 효과적으로 요약하는 데 이 모델은 한국어 문장을 효과적으로 요약하는 데 사용될 수 있습니다.

Downloads last month
5
Safetensors
Model size
95.6M params
Tensor type
F32
·