Spaces:

cheesexuebao
/

murphy

Sleeping

+import pandas as pd
+from tqdm.auto import tqdm
+import torch
+from transformers import BertTokenizerFast as BertTokenizer, BertForSequenceClassification
+import os
+import glob
+RANDOM_SEED = 42
+pd.RANDOM_SEED = 42
+LABEL_COLUMNS = ["Assertive Tone", "Conversational Tone", "Emotional Tone", "Informative Tone"]
@torch.no_grad()
def predict_csv(data, text_col, tokenizer, model, device, text_bs=16, max_token_len=128):
    """Score every row of ``data[text_col]`` and store one column per label.

    The texts are tokenized and run through ``model`` in batches of
    ``text_bs`` rows. The sigmoid of the logits is written into ``data``
    under the names listed in ``LABEL_COLUMNS``.

    Args:
        data: DataFrame holding the texts. It is modified in place.
        text_col: Name of the column that contains the text to score.
        tokenizer: Tokenizer called with the keyword arguments used below;
            must return ``input_ids`` and ``attention_mask`` tensors.
        model: Model whose output exposes ``.logits`` with one column per
            entry of ``LABEL_COLUMNS``.
        device: Torch device the input tensors are moved to.
        text_bs: Number of texts per forward pass.
        max_token_len: Length every text is padded / truncated to.

    Returns:
        The same ``data`` object, with the label columns added or
        overwritten.
    """
    # Empty CSV cells are read by pandas as float NaN, which is not valid
    # tokenizer input; score them as empty strings instead of aborting.
    post = data[text_col].fillna("").astype(str)
    num_text = len(post)
    batch_starts = range(0, num_text, text_bs)

    predictions = []
    for start in tqdm(batch_starts, total=len(batch_starts), desc="Processing..."):
        # iloc slices by position, independent of the frame's index labels.
        texts = post.iloc[start:start + text_bs].tolist()
        encoding = tokenizer(
            texts,
            add_special_tokens=True,
            max_length=max_token_len,
            return_token_type_ids=False,
            padding="max_length",
            truncation=True,
            return_attention_mask=True,
            return_tensors='pt',
        )
        logits = model(
            encoding["input_ids"].to(device),
            encoding["attention_mask"].to(device),
            return_dict=True
        ).logits
        predictions.append(torch.sigmoid(logits).cpu())

    if predictions:
        final_pred = torch.cat(predictions, dim=0)
    else:
        # torch.cat() rejects an empty list; an empty frame still gets its
        # (empty) label columns.
        final_pred = torch.empty((0, len(LABEL_COLUMNS)))

    # Transpose to (labels, rows) so each row of the array is one column.
    for label, scores in zip(LABEL_COLUMNS, final_pred.numpy().T):
        data[label] = scores.tolist()
    return data
@torch.no_grad()
def predict_single(sentence, tokenizer, model, device, max_token_len=128):
    """Return the sigmoid of the model logits for ``sentence`` as a flat list.

    Args:
        sentence: Text passed straight to ``tokenizer``.
        tokenizer: Tokenizer returning ``input_ids`` and ``attention_mask``
            tensors.
        model: Model whose output exposes ``.logits``.
        device: Torch device the input tensors are moved to.
        max_token_len: Length the text is padded / truncated to.

    Returns:
        List of floats, one per logit.
    """
    tokenizer_options = dict(
        add_special_tokens=True,
        max_length=max_token_len,
        return_token_type_ids=False,
        padding="max_length",
        truncation=True,
        return_attention_mask=True,
        return_tensors='pt',
    )
    batch = tokenizer(sentence, **tokenizer_options)

    input_ids = batch["input_ids"].to(device)
    attention_mask = batch["attention_mask"].to(device)
    output = model(input_ids, attention_mask, return_dict=True)

    scores = torch.sigmoid(output.logits)
    # Flattened to 1-D, so no transpose is needed before listing the values.
    return scores.flatten().cpu().numpy().tolist()
def model_factory(local_path, device):
    """Load every model directory found directly under ``local_path``.

    Args:
        local_path: Directory whose sub-directories each hold one saved
            model together with its tokenizer files.
        device: Torch device each model is moved to.

    Returns:
        Dict mapping each sub-directory name to
        ``{"model": ..., "tokenizer": ...}``. Empty when no sub-directory
        exists.
    """
    manager = {}
    # glob order depends on the filesystem; sort so the mapping (and any UI
    # built from its keys) is reproducible.
    for model_path in sorted(glob.glob(os.path.join(local_path, "*"))):
        # Stray files next to the model folders are not loadable models.
        if not os.path.isdir(model_path):
            continue
        # Use the directory name as-is: splitting off an "extension" would
        # truncate names that contain a dot.
        model_name = os.path.basename(model_path)
        tokenizer = BertTokenizer.from_pretrained(model_path)
        model = BertForSequenceClassification.from_pretrained(model_path)
        model = model.to(device)
        # Inference only: make sure dropout is disabled.
        model.eval()
        manager[model_name] = {
            "model": model,
            "tokenizer": tokenizer
        }
    return manager
if __name__ == "__main__":
    # Smoke test: score the first 20 rows of the sample CSV and one fixed
    # sentence with every model found under ./models.
    # NOTE(review): this commit adds the CSV under assets/ - confirm the
    # working directory this script is meant to be run from.
    Data = pd.read_csv("Kickstarter_sentence_level_5000.csv")
    # Copy the slice: predict_csv assigns new columns to the frame, which on
    # a plain slice triggers pandas' SettingWithCopyWarning.
    Data = Data[:20].copy()
    device = torch.device('cpu')
    manager = model_factory("./models", device)
    # DataFrame.to_csv() does not create missing directories.
    os.makedirs("output", exist_ok=True)
    for model_name, dct in manager.items():
        model, tokenizer = dct['model'], dct['tokenizer']
        fk_doc_result = predict_csv(Data, "content", tokenizer, model, device)
        single_response = predict_single("Games of the imagination teach us actions have consequences in a realm that can be reset.", tokenizer, model, device)
        # Show the single-sentence scores so this check is actually visible.
        print(model_name, single_response)
        fk_doc_result.to_csv(f"output/prediction_{model_name}.csv")

app.py CHANGED Viewed

@@ -1,54 +1,132 @@
 import gradio as gr
 import pandas as pd
 import matplotlib.pyplot as plt
-# from Prediction import *
-# 定义处理函数
-def process_data(csv_file, num, model_name):
-    # 读取CSV文件
     df = pd.read_csv(csv_file.name)
-    # 处理数据
-    processed_data = df * num
-    # 生成图片
-    plt.plot(processed_data)
-    plt.xlabel('X Label')
-    plt.ylabel('Y Label')
-    plt.title('Processed Data')
-    plt.grid(True)
-    plt.savefig('output.png')
-    plt.close()
-    # 生成字符串结果
-    result = pd.DataFrame({'result':[1,2,3]})
-    result.to_csv('output.csv')
-    print(model_name)
-    return 'output.csv', ['output.png','output.png']
-my_theme = gr.Theme.from_hub("gstaff/sketch")
-with gr.Blocks(theme=my_theme, title='Test') as demo:
-    gr.Markdown("""# Test
-    xxxx
-    """)
     with gr.Tab("Single Sentence"):
-        with gr.Column():
-            csv_input = gr.File(label="CSV文件")
-            text_output = gr.File(label="结果")
-            image_output = gr.Gallery(label="图像")
         with gr.Row():
-            seed_input = gr.Slider(minimum=0, maximum=100, step=1, label="seed",info="Different seeds may generate different results")
-            model_input = gr.CheckboxGroup(["ALL_Data", "Facebook", "Kickstarter", "Twitter"], label="Countries", info="Where are they from?")
         with gr.Row():
             button = gr.Button("Submit", variant="primary")
-            button.click(fn=process_data, inputs=[csv_input, seed_input, model_input], outputs=[text_output, image_output])
-            clear = gr.ClearButton([csv_input, text_output, image_output])
-    with gr.Tab("Csv File"):
-        ...
-    with gr.Tab("README"):
-        seed_input = gr.Textbox(label="seed")
 demo.launch()

 import gradio as gr
 import pandas as pd
 import matplotlib.pyplot as plt
+from Prediction import *
+import os
+from datetime import datetime
# Example sentences offered in the UI: one per line of assets/examples.txt
# when that file exists, otherwise a small built-in list.
examples = []
if os.path.exists("assets/examples.txt"):
    with open("assets/examples.txt", "r", encoding="utf8") as file:
        # Skip blank lines so the UI never offers an empty example.
        examples = [line.strip() for line in file if line.strip()]
if not examples:
    # Also reached when the file exists but holds no usable line.
    examples = [
        "Games of the imagination teach us actions have consequences in a realm that can be reset.",
        "But New Jersey farmers are retiring and all over the state, development continues to push out dwindling farmland.",
        "He also is the Head Designer of The Design Trust so-to-speak, besides his regular job ..."
    ]
+device = torch.device('cpu')
+manager = model_factory("./models", device)
def single_sentence(sentence, model_select):
    """Score ``sentence`` with every selected model.

    Args:
        sentence: Text to score.
        model_select: Iterable of model names; each must be a key of the
            module-level ``manager``.

    Returns:
        One row per selected model: the model name followed by the values
        returned by ``predict_single``.
    """
    rows = []
    for name in model_select:
        entry = manager[name]
        scores = predict_single(sentence, entry['tokenizer'], entry['model'], device)
        rows.append([name, *scores])
    return rows
def csv_process(csv_file, model_select, attr="content"):
    """Score the ``attr`` column of an uploaded CSV with each selected model.

    Args:
        csv_file: Upload object whose ``.name`` is the path of the CSV file.
        model_select: Iterable of model names; each must be a key of the
            module-level ``manager``.
        attr: Name of the column that holds the text to score.

    Returns:
        List with the path of one prediction CSV per selected model, in
        selection order.
    """
    # One timestamp per request so all files of a run share the same suffix.
    formatted_time = datetime.now().strftime("%Y_%m_%d_%H_%M_%S")
    df = pd.read_csv(csv_file.name)
    # DataFrame.to_csv() does not create missing directories, so without this
    # the first write fails wherever output/ has not been created by hand.
    os.makedirs("output", exist_ok=True)
    outputs = []
    for model_name in model_select:
        # Each model gets its own copy so its columns never leak into the
        # file written for another model.
        data = df.copy(deep=True)
        dct = manager[model_name]
        model, tokenizer = dct['model'], dct['tokenizer']
        predictions = predict_csv(data, attr, tokenizer, model, device)
        output_path = f"output/prediction_{model_name}_{formatted_time}.csv"
        predictions.to_csv(output_path)
        outputs.append(output_path)
    return outputs
# Gradio UI: one tab to score a single sentence, one to score a CSV file,
# and a README tab. The theme is fetched from the Hugging Face Hub.
my_theme = gr.Theme.from_hub("JohnSmith9982/small_and_pretty")
with gr.Blocks(theme=my_theme, title='XXX') as demo:
    # Page header (title and badges). The style attribute of the badge row
    # is now properly closed; it used to swallow the markup that followed.
    gr.HTML(
        """
        <div style="display: flex; justify-content: center; align-items: center; text-align: center;">
        <a href="https://github.com/xxx" style="margin-right: 20px; text-decoration: none; display: flex; align-items: center;">
        </a>
        <div>
            <h1 >Place the title of the paper here</h1>
            <h5 style="margin: 0;">If you like our project, please give us a star ✨ on Github for the latest update.</h5>
            <div style="display: flex; justify-content: center; align-items: center; text-align: center;">
                <a href="https://arxiv.org/abs/xx.xx"><img src="https://img.shields.io/badge/Arxiv-xx.xx-red"></a>
                <a href='https://huggingface.co/spaces/cheesexuebao/murphy'><img src='https://img.shields.io/badge/Project_Page-Murphy/xxBert' alt='Project Page'></a>
                <a href='https://github.com'><img src='https://img.shields.io/badge/Github-Code-blue'></a>
            </div>
        </div>
        </div>
        """)
    with gr.Tab("Single Sentence"):
        with gr.Row():
            tbox_input = gr.Textbox(label="Input",
                                    info="Please input a sentence here:")
            # list(manager) hands Gradio a plain list of the model names
            # instead of a dict view.
            model_select = gr.CheckboxGroup(list(manager),
                                            label="Models:",
                                            info="Selecting different model variants to obtain aggregated predictions.")
        tab_output = gr.DataFrame(label='Probability Predictions:',
                                  headers=["model"] + LABEL_COLUMNS,
                                  datatype=["str"] * (len(LABEL_COLUMNS)+1),
                                  interactive=False,
                                  wrap=True)
        with gr.Row():
            button_ss = gr.Button("Submit", variant="primary")
            button_ss.click(fn=single_sentence, inputs=[tbox_input, model_select], outputs=[tab_output])
            gr.ClearButton([tbox_input, tab_output])
        gr.Markdown("## Examples")
        gr.Examples(
            examples=examples,
            inputs=tbox_input,
            examples_per_page=5
        )
    with gr.Tab("Csv File"):
        with gr.Row():
            csv_input = gr.File(label="CSV File:",
                                file_types=['.csv'],
                                file_count="single"
                                )
            csv_output = gr.File(label="Predictions:")
        # Separate name so this tab's selector does not rebind the one used
        # by the "Single Sentence" tab.
        csv_model_select = gr.CheckboxGroup(list(manager),
                label="Models:",
                info="Selecting different model variants to obtain aggregated predictions.")
        with gr.Row():
            button = gr.Button("Submit", variant="primary")
            button.click(fn=csv_process, inputs=[csv_input, csv_model_select], outputs=[csv_output])
            gr.ClearButton([csv_input, csv_output])
        gr.Markdown("## Examples")
        gr.Examples(
            examples=["assets/csv_examples.csv",],
            inputs=csv_input
        )
    with gr.Tab("Readme"):
        gr.Markdown(
            """
            # Paper Name
            # Authors
            + First author
            + Corresponding author
            # Detailed Information
            ...
            """
        )
demo.launch()

assets/Kickstarter_sentence_level_5000.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

assets/Prediction.py.bak ADDED Viewed

	@@ -0,0 +1,129 @@

+### install the needed package
+# !pip install transformers
+# !pip install torchmetrics
+# !pip3 install ogb pytorch_lightning -q
+import pandas as pd
+from tqdm.auto import tqdm
+import torch
+import torch.nn as nn
+from torch.utils.data import DataLoader, Dataset
+from transformers import BertTokenizerFast as BertTokenizer, BertModel, AdamW, get_linear_schedule_with_warmup
+# import pytorch_lightning as pl
+pd.set_option('display.max_columns', 500)
+RANDOM_SEED = 42
class ModelTagger(nn.Module):
    """BERT encoder followed by a 4-output linear head with sigmoid scores."""

    def __init__(self, model_path="bert-base-uncased"):
        """Load the encoder from ``model_path`` and build the head and loss."""
        super().__init__()
        self.bert = BertModel.from_pretrained(model_path, return_dict=True)
        hidden_size = self.bert.config.hidden_size
        self.classifier = nn.Linear(hidden_size, 4)
        self.criterion = nn.BCELoss()

    def forward(self, input_ids, attention_mask, labels=None):
        """Return ``(loss, scores)``.

        ``scores`` is the sigmoid of the head applied to the encoder's
        pooled output. ``loss`` is the BCE loss against ``labels``, or the
        integer 0 when no labels are given.
        """
        encoded = self.bert(input_ids, attention_mask=attention_mask)
        scores = torch.sigmoid(self.classifier(encoded.pooler_output))
        if labels is None:
            return 0, scores
        return self.criterion(scores, labels), scores
class Predict_Dataset(Dataset):
    """Dataset that tokenizes one DataFrame row per item, for inference."""

    def __init__(
        self,
        data: pd.DataFrame,
        text_col: str,
        tokenizer: BertTokenizer,
        max_token_len: int = 128
    ):
        """Keep the frame, the text column name, the tokenizer and the length."""
        self.data = data
        self.text_col = text_col
        self.tokenizer = tokenizer
        self.max_token_len = max_token_len

    def __len__(self):
        """Return the number of rows in the frame."""
        return len(self.data)

    def __getitem__(self, index: int):
        """Return the raw text plus its flattened token ids and attention mask."""
        post = self.data.iloc[index][self.text_col]
        encoding = self.tokenizer.encode_plus(
            post,
            add_special_tokens=True,
            max_length=self.max_token_len,
            return_token_type_ids=False,
            padding="max_length",
            truncation=True,
            return_attention_mask=True,
            return_tensors='pt',
        )
        # flatten() drops the leading batch dimension added by
        # return_tensors='pt'.
        return {
            "post": post,
            "input_ids": encoding["input_ids"].flatten(),
            "attention_mask": encoding["attention_mask"].flatten(),
        }
def predict(data, text_col, tokenizer, model, device, LABEL_COLUMNS, max_token_len=128, batch_size=1000):
    """Score every row of ``data[text_col]`` and return the scores per label.

    Args:
        data: DataFrame holding the texts.
        text_col: Name of the column that contains the text to score.
        tokenizer: Tokenizer handed to ``Predict_Dataset``.
        model: Callable returning ``(loss, scores)`` for a batch of
            ``input_ids`` and ``attention_mask``.
        device: Torch device the input tensors are moved to.
        LABEL_COLUMNS: Label names, in the order of the model's outputs.
        max_token_len: Length every text is padded / truncated to.
        batch_size: Number of rows per forward pass.

    Returns:
        Dict mapping each label name to the list of its per-row scores.
    """
    df_token = Predict_Dataset(data, text_col, tokenizer, max_token_len=max_token_len)
    loader = DataLoader(df_token, batch_size=batch_size, num_workers=0)

    predictions = []
    # Inference only: without no_grad() every forward pass records an
    # autograd graph that is thrown away right after.
    with torch.no_grad():
        for item in tqdm(loader):
            _, prediction = model(
                item["input_ids"].to(device),
                item["attention_mask"].to(device)
            )
            predictions.append(prediction.detach().cpu())

    if not predictions:
        # torch.cat() rejects an empty list; an empty frame has no scores.
        return {label: [] for label in LABEL_COLUMNS}

    # Transpose to (labels, rows) so each row of the array is one label.
    y_inten = torch.cat(predictions, dim=0).numpy().T
    return {label: scores.tolist() for label, scores in zip(LABEL_COLUMNS, y_inten)}
def get_result(df, result, LABEL_COLUMNS):
    """Copy the first four label columns from ``result`` into ``df``.

    ``df`` is modified in place and also returned.
    """
    for position in range(4):
        label = LABEL_COLUMNS[position]
        df[label] = result[label]
    return df
# Script section: score the first 20 rows of the sample CSV with the
# Kickstarter checkpoint and write the result to output/.
import os  # needed only here; this file's import block does not provide it

Data = pd.read_csv("Kickstarter_sentence_level_5000.csv")
# Copy the slice: get_result assigns new columns to the frame, which on a
# plain slice triggers pandas' SettingWithCopyWarning.
Data = Data[:20].copy()
device = torch.device('cpu')
BERT_MODEL_NAME = 'bert-base-uncased'
tokenizer = BertTokenizer.from_pretrained(BERT_MODEL_NAME)
LABEL_COLUMNS = ["Assertive Tone", "Conversational Tone", "Emotional Tone", "Informative Tone"]
# NOTE: torch.load unpickles the file - only load checkpoints you trust.
params = torch.load("checkpoints/Kickstarter.ckpt", map_location='cpu')['state_dict']
kick_model = ModelTagger()
# strict=True: fail loudly if the checkpoint does not match the model.
kick_model.load_state_dict(params, strict=True)
kick_model.eval()
kick_model = kick_model.to(device)
kick_fk_doc_result = predict(Data, "content", tokenizer, kick_model, device, LABEL_COLUMNS)
fk_result = get_result(Data, kick_fk_doc_result, LABEL_COLUMNS)
# DataFrame.to_csv() does not create missing directories.
os.makedirs("output", exist_ok=True)
fk_result.to_csv("output/prediction_origin_Kickstarter.csv")

assets/csv_examples.csv ADDED Viewed

	@@ -0,0 +1,30 @@

+,index,content,word_count
+0,225644,The first prototype did not clip together well and had strength issues so we redesigned it with new sides and a different tabs structure.,24
+1,989071,Maybe you own a shop or perhaps you and your friends want to go in on this together to save some money.,22
+2,332310,"With this campaign we want to propose ""Eternity Dice Regular and Charms Edition"", sculpted by hand in stone, with a polished finish and highly accurate details.",26
+3,101474,"It's hand cut from a thick and reliable high quality calf skin, which is soft and flexible enough for wearing with utmost comfort.",23
+4,1641986,"a#  by  5       WHAT SEPARATES US FROM THE COMPETITION     a lax-ll 360 AUDIO FLOATABLE Full submergable up to Superior surround sound Counter balanced for optimal 1 meter for 30 minutes audio direction while floating     WIRELESS SPECIFICATIONS MATERIALS  sarr of whreless Small and compact, with Engineered to perfection streaming range enormous sound with the highest quality  materials avalable     PRICE-POINT WARRANTY BVURABILITY  Affordable technology Cone yearlimited warranty | Rubberized shock absorbing cover     PATENTS BUILT-IN MIC BATTERY LIFE  Patent.Pending stabalization .",78
+5,1632938,Much of the known world is either from this culture or has converted to the faith.,16
+6,1141502,"The more I play it, the more I want to play it.",12
+7,1424712,"There are weapons all around you, you just never thought about your household goods that way.",16
+8,460625,"In September, I'm going down to Virginia with a bunch of my music buddies to record the album.",18
+9,179267,"It is suitable for use with Cthulhu, Horror, Space and Dungeon - style miniature games.",15
+10,1092530,Games of the imagination teach us actions have consequences in a realm that can be reset.,16
+11,1050585,"Intense cleaning of the existing space, brick repairs, and removal of unneeded materials is also necessary.",16
+12,1126342,These will include color artwork and fully designed stats to help you build exciting and unique Shadowlands encounters.,18
+13,277427,"If you're leaving the backpack unattended, the bag itself can be secured to almost any fixed object using the integrated steel wire and combination lock, making it impossible for opportunistic thieves to access your belongings or steal the bag, without special cutting equipment.",43
+14,307425,Their parents had recruited the police and even had the church issuing official statements forbidding the girls to walk through monastery doors.,22
+15,611566,is a childrenâs book for elementary school age kids with illustrations appealing to people of all ages.,17
+16,951173,"Thanks to you we reached our original goal, so we got festival fees and insurance covered.",16
+17,1294624,"Â It's been really well-received, and recently won an online award for Best New Tabletop Sports Game of 2013.",19
+18,686912,"But New Jersey farmers are retiring and all over the state, development continues to push out dwindling farmland.",18
+19,1291430,"Support Cards for easily setting initiative and keeping track of hit points, ammo, etc, speeding things up and eliminating the need for any writing/erasing Deep character creation with options designed for interesting roleplaying, and super fast to create (5 minutes or less) Specially laminated Character Cards take the place of the old character sheet, making information extremely easy to find and removing clutter from the gaming table Easily expandable without having to purchase and read through lengthy new books - newÂ equipment, weapons, powers, skills, and opponents can be instantly added to your game with Setting Cards All special rules for equipment, weapons, powers, skills, and opponents printed on cards kept in player hands, so you never have to go searching for them Completely genre neutral, so assets from any setting are completely compatible with any others, making your game infinitely expandable and customizable Tech-themed Resolution Deck Concept Built from the ground up with VTTs (Virtual Table Tops) in mind, with all digital assets ready to drop into your game to integrate seamlessly with groups who play remotely Complete playable module with starter adventure included in backer rewards of $10 or more!",192
+20,1656635,"Their bond of friendship makes the journey more important than the destination as they share their dreams, frustrations and fears.Â The story goes on to show the dramatic impact this innocent childhood adventure has on their young adult lives.",39
+21,1679298,"He also is the Head Designer of The Design Trust so-to-speak, besides his regular job ...",16
+22,337389,"This year, the film team has plans to produce a short comedy, based on a true story set in the city of Jerusalem.",23
+23,980529,"$12,000 - Roguelike Player Mat This player mat will include extra rules to play Baldrick's Tomb as a solo player Roguelike.",21
+24,1700094,_ Thank you for viewing the project!,7
+25,420192,We appreciate your support and thank you for joining us in helping cause this mission stay in action.,18
+26,1469419,It'll even be foil-wrapped like baseball cards!,7
+27,105008,We believe that the major players with their massive branding campaigns together with the margins applied by distributors and retailers are a business model that doesnât deliver a fair value to customers.,32
+28,1505209,"If you want to take advantage of the Rhino Slider's versatility, you'll have an option to add extra sets of rails after the campaign ends.",25

assets/examples.txt ADDED Viewed

	@@ -0,0 +1,14 @@

+Games of the imagination teach us actions have consequences in a realm that can be reset.
+Intense cleaning of the existing space, brick repairs, and removal of unneeded materials is also necessary.
+Thanks to you we reached our original goal, so we got festival fees and insurance covered.
+Â It's been really well-received, and recently won an online award for Best New Tabletop Sports Game of 2013.
+But New Jersey farmers are retiring and all over the state, development continues to push out dwindling farmland.
+Our chemical-free process provides unmatched comfort.
+However, this chart does not factor in special ability influence since that varies with the ability being used.
+I'd like to do something similar with pictures.
+This means you can feel more than comfortable putting them in your back pocket or purse.
+She holds a degree from the Advertising University of Madrid.
+Skeleton Birds are heading to Groovebox Studios on March 17th to record and film a live GBS Detroit EP and video.
+Please help support us & make this awesome case a reality!
+So... We're asking for $3,000 per song.
+You also have battle items and action cards to defeat your gnome enemies.

convert.py ADDED Viewed

	@@ -0,0 +1,28 @@

+import torch
+import glob
+import os
+from transformers import BertTokenizerFast as BertTokenizer, BertForSequenceClassification
# Convert every checkpoints/*.ckpt into a models/<name>/ folder holding
# pytorch_model.bin, config.json and the tokenizer vocabulary.
LABEL_COLUMNS = ["Assertive Tone", "Conversational Tone", "Emotional Tone", "Informative Tone"]
tokenizer = BertTokenizer.from_pretrained("bert-base-uncased")
# One output per label; derived from the list so the two cannot drift apart.
model = BertForSequenceClassification.from_pretrained("bert-base-uncased", num_labels=len(LABEL_COLUMNS))
id2label = {i: label for i, label in enumerate(LABEL_COLUMNS)}
label2id = {label: i for i, label in enumerate(LABEL_COLUMNS)}

# The label metadata is identical for every checkpoint, so set it once.
config = model.config
config.architectures = ['BertForSequenceClassification']
config.label2id = label2id
config.id2label = id2label

# Sorted so the conversion order does not depend on the filesystem.
for ckpt in sorted(glob.glob('checkpoints/*.ckpt')):
    # Strip the file extension to get the model name.
    model_name = os.path.splitext(os.path.basename(ckpt))[0]
    # NOTE: torch.load unpickles the file - only load checkpoints you trust.
    params = torch.load(ckpt, map_location="cpu")['state_dict']
    # strict=True: fail loudly if the checkpoint does not match the model.
    model.load_state_dict(params, strict=True)
    path = f'models/{model_name}'
    os.makedirs(path, exist_ok=True)
    torch.save(model.state_dict(), f'{path}/pytorch_model.bin')
    config.to_json_file(f'{path}/config.json')
    tokenizer.save_vocabulary(path)

{bert-base-uncased → models/All_Data}/config.json RENAMED Viewed

@@ -1,14 +1,28 @@
 {
   "architectures": [
-    "BertForMaskedLM"
   ],
   "attention_probs_dropout_prob": 0.1,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
@@ -16,7 +30,7 @@
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
-  "transformers_version": "4.6.0.dev0",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 30522

 {
+  "_name_or_path": "bert-base-uncased",
   "architectures": [
+    "BertForSequenceClassification"
   ],
   "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
   "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
+  "id2label": {
+    "0": "Assertive Tone",
+    "1": "Conversational Tone",
+    "2": "Emotional Tone",
+    "3": "Informative Tone"
+  },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
+  "label2id": {
+    "Assertive Tone": 0,
+    "Conversational Tone": 1,
+    "Emotional Tone": 2,
+    "Informative Tone": 3
+  },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "model_type": "bert",
   "num_hidden_layers": 12,
   "pad_token_id": 0,
   "position_embedding_type": "absolute",
+  "transformers_version": "4.36.2",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 30522

{bert-base-uncased → models/All_Data}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:097417381d6c7230bd9e3557456d726de6e83245ec8b24f529f60198a67b203a
-size 440473133

 version https://git-lfs.github.com/spec/v1
+oid sha256:4edf18d14298c9a7057bbbdbc88cddf3b673e452103c6c4b882e1cec14d51c53
+size 438021294

{bert-base-uncased → models/All_Data}/vocab.txt RENAMED Viewed

File without changes

bert-base-uncased/bert_config.json → models/Facebook/config.json RENAMED Viewed

@@ -1,13 +1,37 @@
 {
   "attention_probs_dropout_prob": 0.1,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "max_position_embeddings": 512,
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
   "type_vocab_size": 2,
   "vocab_size": 30522
 }

 {
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
   "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
   "hidden_act": "gelu",
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
+  "id2label": {
+    "0": "Assertive Tone",
+    "1": "Conversational Tone",
+    "2": "Emotional Tone",
+    "3": "Informative Tone"
+  },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
+  "label2id": {
+    "Assertive Tone": 0,
+    "Conversational Tone": 1,
+    "Emotional Tone": 2,
+    "Informative Tone": 3
+  },
+  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
+  "model_type": "bert",
   "num_attention_heads": 12,
   "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "transformers_version": "4.36.2",
   "type_vocab_size": 2,
+  "use_cache": true,
   "vocab_size": 30522
 }

models/Facebook/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f511b8b4b91b5fa408c5b3220ce0fe9b61b2f9a3a54dd00acb3a81aa0a2a19e8
+size 438021294

models/Facebook/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

models/Kickstarter/config.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Assertive Tone",
+    "1": "Conversational Tone",
+    "2": "Emotional Tone",
+    "3": "Informative Tone"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Assertive Tone": 0,
+    "Conversational Tone": 1,
+    "Emotional Tone": 2,
+    "Informative Tone": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "transformers_version": "4.36.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

models/Kickstarter/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b98553cd5a9b23babc4e20ade9abda931497de3103acf09656eb39cfcbb0c485
+size 438021294

models/Kickstarter/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

models/Twitter/config.json ADDED Viewed

	@@ -0,0 +1,37 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "id2label": {
+    "0": "Assertive Tone",
+    "1": "Conversational Tone",
+    "2": "Emotional Tone",
+    "3": "Informative Tone"
+  },
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "label2id": {
+    "Assertive Tone": 0,
+    "Conversational Tone": 1,
+    "Emotional Tone": 2,
+    "Informative Tone": 3
+  },
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "transformers_version": "4.36.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

models/Twitter/pytorch_model.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6abf83c8c66c4f3fcaba340dcab3b5b1f4f2b66381b21a5aacab086194cf0cbd
+size 438021294

models/Twitter/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

requirements.txt CHANGED Viewed

@@ -1,4 +1,5 @@
 torch
 transformers
 tqdm
-pandas

 torch
 transformers
 tqdm
+pandas
+datetime