Spaces:

fkonovalenko
/

llm4career

Sleeping

fkonovalenko committed on Apr 25, 2024

Commit

d99e452

1 Parent(s): f05530b

first commit

Files changed (3) hide show

app.py CHANGED Viewed

@@ -12,7 +12,6 @@ class GlobalState:
     result_file_path = os.path.join(os.path.dirname(__file__), 'result/archive.json')
     result_dir = os.path.join(os.path.dirname(__file__), 'result')
     bert_path = os.path.join(os.path.dirname(__file__), 'tiny.pt')
-    catboost_path = os.path.join(os.path.dirname(__file__), 'best_cat.joblib')
     conv_classes = {0: 'low',
                     1: 'middle',
                     2: 'high'
@@ -72,7 +71,7 @@ def append_to_json(_dict, path):
 def predict(btn):
-    analyzer = VacancyAnalyzer(GlobalState.bert_path, GlobalState.catboost_path, GlobalState.data)
     status, result = analyzer.classify()
     gr.Info(status)
     if result != 'unknown':

     result_file_path = os.path.join(os.path.dirname(__file__), 'result/archive.json')
     result_dir = os.path.join(os.path.dirname(__file__), 'result')
     bert_path = os.path.join(os.path.dirname(__file__), 'tiny.pt')
     conv_classes = {0: 'low',
                     1: 'middle',
                     2: 'high'
 def predict(btn):
+    analyzer = VacancyAnalyzer(GlobalState.bert_path, GlobalState.data)
     status, result = analyzer.classify()
     gr.Info(status)
     if result != 'unknown':

ml.py CHANGED Viewed

@@ -1,5 +1,4 @@
 import pandas as pd
-from catboost import Pool
 import joblib
 import torch
 import re
@@ -8,9 +7,8 @@ from llm import TransformerRegrModel
 class VacancyAnalyzer:
-    def __init__(self, transformer_path: str, catboost_path: str, inputs: dict):
         self.transformer_path = transformer_path
-        self.catboost_path = catboost_path
         self.inputs = pd.DataFrame(inputs, index=[0]).drop(columns=['conversion', 'conversion_class', 'id'], axis=1)
         self.cat_features = ['profession', 'grade', 'location']
         self.text_features = ['emp_brand', 'mandatory', 'additional', 'comp_stages', 'work_conditions']
@@ -21,13 +19,6 @@ class VacancyAnalyzer:
         txt = re.sub(r'([\n\t]*)', r'', txt)
         return txt
-    def predict(self) -> float:
-        df = self.inputs.drop(columns=self.text_features, axis=1)
-        pool = Pool(df, cat_features=self.cat_features)
-        regressor = joblib.load(self.catboost_path)
-        prediction = regressor.predict(pool).tolist()
-        return prediction[0]
     def classify(self) -> tuple:
         df = self.inputs[self.text_features]
         description = df[self.text_features[0]].values[0] + ' '

 import pandas as pd
 import joblib
 import torch
 import re
 class VacancyAnalyzer:
+    def __init__(self, transformer_path: str, inputs: dict):
         self.transformer_path = transformer_path
         self.inputs = pd.DataFrame(inputs, index=[0]).drop(columns=['conversion', 'conversion_class', 'id'], axis=1)
         self.cat_features = ['profession', 'grade', 'location']
         self.text_features = ['emp_brand', 'mandatory', 'additional', 'comp_stages', 'work_conditions']
         txt = re.sub(r'([\n\t]*)', r'', txt)
         return txt
     def classify(self) -> tuple:
         df = self.inputs[self.text_features]
         description = df[self.text_features[0]].values[0] + ' '

tiny.pt ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:c505eb64cc6dd292b8823ff2d996f84ff199ff0ce5117aaef95ddcffe1c6cefc
+size 116799348