from transformers import PegasusForConditionalGeneration from tokenizers_pegasus import PegasusTokenizer import re import pandas as pd import jieba import jieba.analyse as jay import paddle from pyecharts import options as opts from pyecharts.charts import Funnel paddle.enable_static() # -*- coding: utf-8 -*- ARTICLE_PATH = '2.xlsx' CACHE_PATH = '' def get_keywords_in_article(): def key_word(data): data = str(data).strip() result = re.findall(pattern='pan>(.*?)