Spaces:

nkigumnov
/

banks-ethics-sentiment

Build error

App Files Files Community

nkigumnov committed on Apr 17, 2023

Commit

a2887cd

•

1 Parent(s): 9ae54b8

Upload 5 files

Browse files

Files changed (5) hide show

app.py +47 -0
best_model_bert.pth +3 -0
best_model_heads.pth +3 -0
model.py +153 -0
requirements.txt +5 -0

app.py ADDED Viewed

	@@ -0,0 +1,47 @@

+import gradio as gr
+from model import inference
+def predict(sentence: str):
+    model_response = inference({"sentence": sentence})
+    prob = model_response["answer"]
+    df = {
+        "1": float(prob[1][0][2]),
+        "0": float(prob[1][0][1]),
+        "-1": float(prob[1][0][0]),
+        "Communication": float(prob[0][0][0]),
+        "Quality": float(prob[0][0][1]),
+        "Price": float(prob[0][0][2]),
+        "Safety": float(prob[0][0][3]),
+    }
+    return (
+        df["1"],
+        df["0"],
+        df["-1"],
+        df["Communication"],
+        df["Quality"],
+        df["Price"],
+        df["Safety"],
+    )
+if __name__ == "__main__":
+    print("App started")
+    demo = gr.Interface(
+        fn=predict,
+        title="Try it yourself!",
+        inputs=gr.Textbox(lines=3, placeholder="Sentence here..."),
+        outputs=[
+            gr.Number(0.0, label="1"),
+            gr.Number(0.0, label="0"),
+            gr.Number(0.0, label="-1"),
+            gr.Number(0.0, label="Communication"),
+            gr.Number(0.0, label="Quality"),
+            gr.Number(0.0, label="Price"),
+            gr.Number(0.0, label="Safety"),
+        ],
+    )
+    demo.launch(server_name="0.0.0.0", server_port=8080)

best_model_bert.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2183c10359aa1a55a8510ed1d8c3a02678b0f0aa585f8a931e9db5493db7cc21
+size 709923201

best_model_heads.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5796bc27244f82089e1950d4d308b2ca8c06b7e649fd2acf0ec859cef121465e
+size 136297

model.py ADDED Viewed

	@@ -0,0 +1,153 @@

+#!g1.1
+import torch
+import torch.nn as nn
+from transformers import AutoTokenizer, AutoModel
+import copy
+class DL_category(nn.Module):
+    def __init__(self):
+        super(DL_category, self).__init__()
+        self.lin1 = nn.Linear(256, 64)
+        nn.init.xavier_uniform_(self.lin1.weight)
+        self.lin2 = nn.Linear(64, 5)
+        nn.init.xavier_uniform_(self.lin2.weight)
+    def forward(self, x):
+        x = torch.relu(self.lin1(x))
+        x = self.lin2(x)
+        return x
+class DL_sentiment(nn.Module):
+    def __init__(self):
+        super(DL_sentiment, self).__init__()
+        self.lin1 = nn.Linear(256, 64)
+        nn.init.xavier_uniform_(self.lin1.weight)
+        self.lin2 = nn.Linear(64, 1, bias=False)
+        nn.init.xavier_uniform_(self.lin2.weight)
+    def forward(self, x):
+        x = torch.relu(self.lin1(x))
+        x = self.lin2(x)
+        return x
+def mean_pooling(model_output, attention_mask):
+    input_mask_expanded = attention_mask.unsqueeze(-1).expand(model_output.size()).float()
+    sum_embeddings = torch.sum(model_output * input_mask_expanded, 1)
+    sum_mask = torch.clamp(input_mask_expanded.sum(1), min=1e-9)
+    return sum_embeddings / sum_mask
+class Union_model(nn.Module):
+    def __init__(self, bert_model):
+        super(Union_model, self).__init__()
+        bert_model = bert_model
+        for name, param in bert_model.named_parameters():
+            param.requires_grad = False
+        bert_model.pooler = nn.Sequential(
+            nn.Linear(in_features=768, out_features=256)
+        )
+        bert_model = bert_model.to('cpu')
+        #         print(bert_model.parameters)
+        self.DL_cat = DL_category()
+        self.DL_sent = DL_sentiment()
+    def forward(self, input):
+        output = bert_model(**input)
+        output = output.pooler_output
+        output = mean_pooling(output, input['attention_mask'])
+        return self.DL_cat(output), self.DL_sent(output)
+class LogisticCumulativeLink(nn.Module):
+    """
+    Converts a single number to the proportional odds of belonging to a class.
+    Parameters
+    ----------
+    num_classes : int
+        Number of ordered classes to partition the odds into.
+    init_cutpoints : str (default='ordered')
+        How to initialize the cutpoints of the model. Valid values are
+        - ordered : cutpoints are initialized to halfway between each class.
+        - random : cutpoints are initialized with random values.
+    """
+    def __init__(self, num_classes: int,
+                 init_cutpoints: str = 'ordered') -> None:
+        assert num_classes > 2, (
+            'Only use this model if you have 3 or more classes'
+        )
+        super().__init__()
+        self.num_classes = num_classes
+        self.init_cutpoints = init_cutpoints
+        if init_cutpoints == 'ordered':
+            num_cutpoints = self.num_classes - 1
+            cutpoints = torch.arange(num_cutpoints).float() - num_cutpoints / 2
+            self.cutpoints = nn.Parameter(cutpoints)
+        elif init_cutpoints == 'random':
+            cutpoints = torch.rand(self.num_classes - 1).sort()[0]
+            self.cutpoints = nn.Parameter(cutpoints)
+        else:
+            raise ValueError(f'{init_cutpoints} is not a valid init_cutpoints '
+                             f'type')
+    def forward(self, X: torch.Tensor) -> torch.Tensor:
+        """
+        Equation (11) from
+        "On the consistency of ordinal regression methods", Pedregosa et. al.
+        """
+        sigmoids = torch.sigmoid(self.cutpoints - X)
+        link_mat = sigmoids[:, 1:] - sigmoids[:, :-1]
+        link_mat = torch.cat((
+            sigmoids[:, [0]],
+            link_mat,
+            (1 - sigmoids[:, [-1]])
+        ),
+            dim=1
+        )
+        return link_mat
+class CustomOrdinalLogisticModel(nn.Module):
+    def __init__(self, predictor: nn.Module, num_classes: int,
+                 init_cutpoints: str = 'ordered') -> None:
+        super().__init__()
+        self.num_classes = num_classes
+        self.predictor = copy.deepcopy(predictor)
+        self.link = LogisticCumulativeLink(self.num_classes,
+                                           init_cutpoints=init_cutpoints)
+    def forward(self, *args, **kwargs) -> torch.Tensor:
+        cat, sent = self.predictor(*args, **kwargs)
+        return cat, self.link(sent)
+# Module-level setup: executed once at import time. It loads the pretrained
+# tokenizer and encoder by name and reads both checkpoint files from the
+# current working directory.
+tokenizer = AutoTokenizer.from_pretrained('blanchefort/rubert-base-cased-sentiment-rusentiment')
+bert_model = AutoModel.from_pretrained('blanchefort/rubert-base-cased-sentiment-rusentiment',
+                                       output_hidden_states=True).to('cpu')
+# Swap the stock pooler for a 768 -> 256 projection. Union_model.__init__
+# installs a fresh projection of the same shape again when it is constructed.
+bert_model.pooler = nn.Sequential(
+    nn.Linear(in_features=768, out_features=256)
+)
+model = CustomOrdinalLogisticModel(Union_model(bert_model), 3).to('cpu')
+# strict=False: keys missing from or extra in the heads checkpoint are tolerated.
+model.load_state_dict(torch.load('best_model_heads.pth', map_location='cpu'), strict=False)
+# Loaded last and strictly, so this overwrites every encoder weight including
+# the pooler projection created above -- presumably with the fine-tuned
+# values; confirm against the checkpoint.
+# NOTE(review): torch.load unpickles the file; only load trusted checkpoints.
+bert_model.load_state_dict(torch.load('best_model_bert.pth', map_location='cpu'))
+def inference(input_data):
+    tokenized = tokenizer(input_data['sentence'])
+    input_ids = torch.LongTensor(tokenized['input_ids']).unsqueeze(0).to('cpu')
+    attention_mask = torch.IntTensor(tokenized['attention_mask']).unsqueeze(0).to('cpu')
+    model.eval()
+    return dict(answer=model({'input_ids': input_ids, 'attention_mask': attention_mask}))

requirements.txt ADDED Viewed

	@@ -0,0 +1,5 @@

+gradio~=3.27.0
+requests~=2.28.2
+PyYAML~=6.0
+torch~=2.0.0
+transformers~=4.28.1