luisrodriguesphd committed
Commit 9c79212
1 Parent(s): 1ab7f5d

feat: update llm provider to groq and model to llama 3 8b

Dockerfile CHANGED
@@ -21,6 +21,9 @@ ENV MPLCONFIGDIR=$MPLCONFIGDIR
 ARG ENTRYPOINT_PATH="./entrypoint.sh"
 ENV ENTRYPOINT_PATH=$ENTRYPOINT_PATH
 
+# RUN --mount=type=secret,id=GROQ_API_KEY,mode=0444,required=true \
+#     echo "GROQ_API_KEY=$(cat /run/secrets/GROQ_API_KEY)"
+
 # Create the /code/ directory and set rwx permissions
 RUN mkdir -p /code/ && \
     chmod -R 777 /code/
@@ -55,7 +58,6 @@ COPY . .
 RUN pip install -e . && \
     python src/resume_worth/pipelines/data_indexing/pipeline.py
 
-RUN python src/resume_worth/pipelines/text_generation/pipeline.py && \
-    chmod +x $ENTRYPOINT_PATH
+RUN chmod +x $ENTRYPOINT_PATH
 
 ENTRYPOINT $ENTRYPOINT_PATH
conf/.env.example CHANGED
@@ -1,3 +1,6 @@
+# Groq Cloud (to text generation)
+GROQ_API_KEY="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"
+
 # OpenAI (to text generation)
 OPENAI_API_KEY=""
 OPENAI_ORG_ID=""
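A short sketch (not part of the commit) of how this key is expected to reach the code at runtime: set_secrets() (added in utils.py further below) loads conf/.env with python-dotenv, and the Groq loader then reads the variable from the environment:

import os
from resume_worth.utils.utils import set_secrets

set_secrets()  # loads conf/.env via python-dotenv; lru_cache makes repeat calls no-ops
api_key = os.environ.get("GROQ_API_KEY")
if api_key is None:
    raise ValueError("GROQ_API_KEY is not set.")  # same check the Groq loader performs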
conf/params.yml CHANGED
@@ -1,3 +1,8 @@
+# Conf
+conf_dir: ["conf"]
+secrets_file: ".env"
+
+
 # Data
 ingestion_data_dir: ["data", "02_processed"]
 ingestion_metadata_dir: ["data", "02_processed", "metadata"]
@@ -16,16 +21,15 @@ embedding_dir: ["data", "03_indexed"]
 
 
 # LLM / Text Generation
+# Suggestion: huggingface|M4-ai/tau-1.8B; groq|llama3-8b-8192
 # See instructions for parameters: https://www.ibm.com/docs/en/watsonx-as-a-service?topic=lab-model-parameters-prompting
 generative_model:
-  model_name: "M4-ai/tau-1.8B"
+  model_provider: "groq"
+  model_name: "llama3-8b-8192"
   model_kwargs:
-    trust_remote_code: True
-  generate_kwargs:
-    top_k: 30
     top_p: 0.7
+  generate_kwargs:
     temperature: 0.3
-    max_new_tokens: 256
 # See instructions for the prompt: https://huggingface.co/spaces/Locutusque/Locutusque-Models/blob/main/app.py
 prompt_dir: ["data", "04_prompts"]
 promp_file: "prompt_template_for_explaning_why_is_a_good_fit.json"
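For reference, a minimal sketch (not part of the commit) of how the new generative_model block is read downstream; it mirrors the call added in pipeline.py, with the configured values shown as comments:

from resume_worth.utils.utils import get_params
from resume_worth.pipelines.text_generation.nodes import load_text_generation_model

params = get_params()
gm = params['generative_model']
model = load_text_generation_model(
    gm['model_provider'],   # "groq"
    gm['model_name'],       # "llama3-8b-8192"
    gm['model_kwargs'],     # {"top_p": 0.7}
    gm['generate_kwargs'],  # {"temperature": 0.3}
)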
requirements.in CHANGED
@@ -7,6 +7,7 @@ pandas
 # to build LLM Apps
 langchain
 langchain-community
+langchain_groq
 sentence-transformers>=2.3.1
 chromadb
 
src/resume_worth/pipelines/text_generation/nodes.py CHANGED
@@ -1,8 +1,11 @@
 import os
 os.environ['HF_HOME'] = ".cache/huggingface"
 
+from typing import Union
+from resume_worth.utils.utils import set_secrets
 from langchain_community.llms.huggingface_pipeline import HuggingFacePipeline
 from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
+from langchain_groq import ChatGroq
 from langchain_core.prompts import PromptTemplate
 from langchain.prompts import load_prompt
 from functools import lru_cache
@@ -13,26 +16,71 @@ transformers.logging.set_verbosity_error()
 
 
 #@lru_cache(maxsize=None)
+def load_text_generation_model(
+        model_provider:str='groq',
+        model_name:str='llama3-8b-8192',
+        model_kwargs:dict={},
+        generate_kwargs:dict={
+            'temperature': 0.4,
+        },
+    ):
+    """Function to load a text generation model according to the provider."""
+
+    print(f"-> Load {model_name} text generation model from {model_provider}")
+
+    if model_provider=="huggingface":
+        return load_hf_text_generation_model_to_langchain(model_name, model_kwargs, generate_kwargs)
+
+    elif model_provider=="groq":
+        set_secrets()
+        return load_groq_text_generation_model_to_langchain(model_name, model_kwargs, generate_kwargs)
+
+    else:
+        raise Exception("Sorry, the code has no support for this provider yet.")
+
+
+def load_groq_text_generation_model_to_langchain(
+        model_name:str='llama3-8b-8192',
+        model_kwargs:dict={
+            'top_k': 50,
+            'top_p': 0.95,
+            'max_new_tokens': 1024,
+        },
+        generate_kwargs:dict={
+            'temperature': 0.4,
+        }
+    ):
+    """
+    Function to load a text generation model hosted on Groq to be used in LangChain.
+    More info, see: https://console.groq.com/docs/quickstart
+    """
+
+    groq_api_key = os.environ.get('GROQ_API_KEY', None)
+    if groq_api_key is None:
+        raise ValueError("GROQ_API_KEY is not set.")
+
+    groq = ChatGroq(model_name=model_name, model_kwargs=model_kwargs, **generate_kwargs, groq_api_key=groq_api_key)
+
+    return groq
+
+
 def load_hf_text_generation_model_to_langchain(
-        model_name:str='gpt2',
-        model_kwargs:dict={
-            'trust_remote_code': True,
-        },
-        generate_kwargs:dict={
-            'top_k': 50,
-            'top_p': 0.95,
-            'temperature': 0.4,
-            'max_new_tokens': 1024,
-        }
+        model_name:str='gpt2',
+        model_kwargs:dict={
+            'trust_remote_code': True,
+        },
+        generate_kwargs:dict={
+            'top_k': 50,
+            'top_p': 0.95,
+            'temperature': 0.4,
+            'max_new_tokens': 1024,
+        }
     ):
     """
-    Function to load a text generation model hosted on Hugging Face to se used in LangChain.
+    Function to load a text generation model hosted on Hugging Face to be used in LangChain.
     More info, see: https://python.langchain.com/docs/integrations/llms/huggingface_pipelines/
    """
 
-    print(f"-> Load a pretrained text embedding model {model_name}")
-
-    # https://huggingface.co/apple/OpenELM
     tokenizer = AutoTokenizer.from_pretrained(model_name, **model_kwargs)
     model = AutoModelForCausalLM.from_pretrained(model_name, **model_kwargs)
 
@@ -68,10 +116,10 @@ def load_langchain_prompt_template(promp_path: str):
     return prompt
 
 
-def create_langchain_chain(prompt: PromptTemplate, hf_text_generation: HuggingFacePipeline):
+def create_langchain_chain(prompt: PromptTemplate, text_generation_model: Union[HuggingFacePipeline, ChatGroq]):
     """
-    Create a chain by composing the HF text generation model with a LangChain prompt template.
+    Create a chain by composing the text generation model with a LangChain prompt template.
     More info, see: https://python.langchain.com/docs/integrations/llms/huggingface_pipelines/
     """
-    chain = prompt | hf_text_generation
+    chain = prompt | text_generation_model
     return chain
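A minimal usage sketch (not part of the commit) of the new provider-aware loader composed with the existing prompt helpers; the prompt path comes from conf/params.yml, the resume/job strings are placeholders, and GROQ_API_KEY is loaded from conf/.env by set_secrets() inside the loader:

from resume_worth.pipelines.text_generation.nodes import (
    load_text_generation_model,
    load_langchain_prompt_template,
    create_langchain_chain,
)

llm = load_text_generation_model(model_provider="groq", model_name="llama3-8b-8192")
prompt = load_langchain_prompt_template("data/04_prompts/prompt_template_for_explaning_why_is_a_good_fit.json")
chain = create_langchain_chain(prompt, llm)

answer = chain.invoke({"resume": "<resume text>", "job": "<job ad text>"})
print(answer.content)  # ChatGroq returns a chat message, hence .content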
src/resume_worth/pipelines/text_generation/pipeline.py CHANGED
@@ -7,7 +7,7 @@ This pipeline utilizes an LLM to explain why the retrieved job vacancy is a good
 
 import os
 from resume_worth.utils.utils import get_params
-from resume_worth.pipelines.text_generation.nodes import load_hf_text_generation_model_to_langchain, load_langchain_prompt_template, create_langchain_chain
+from resume_worth.pipelines.text_generation.nodes import load_text_generation_model, load_langchain_prompt_template, create_langchain_chain
 
 
 params = get_params()
@@ -20,7 +20,7 @@ def generate_explanation_why_resume_for_a_job(resume: str, job: str):
 
     # Stage 1 - [cacheable] Load text generation model
 
-    text_generation_model = load_hf_text_generation_model_to_langchain(generative_model['model_name'], generative_model['model_kwargs'], generative_model['generate_kwargs'])
+    text_generation_model = load_text_generation_model(generative_model['model_provider'], generative_model['model_name'], generative_model['model_kwargs'], generative_model['generate_kwargs'])
 
     # Stage 2 - [cacheable] Load text generation model
 
@@ -35,6 +35,9 @@ def generate_explanation_why_resume_for_a_job(resume: str, job: str):
 
     answer = text_generation_chain.invoke({"resume": resume, "job": job})
 
+    if generative_model['model_provider']!="huggingface":
+        answer = answer.content
+
     return answer
 
 
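And the top-level entry point after this change, as a short sketch with placeholder inputs:

from resume_worth.pipelines.text_generation.pipeline import generate_explanation_why_resume_for_a_job

explanation = generate_explanation_why_resume_for_a_job(resume="<resume text>", job="<job ad text>")
print(explanation)  # a plain string: .content is already extracted for non-huggingface providers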
src/resume_worth/utils/utils.py CHANGED
@@ -4,6 +4,7 @@ os.environ['HF_HOME'] = ".cache/huggingface"
 import yaml
 from langchain_community.embeddings import HuggingFaceEmbeddings
 import fitz  # imports the pymupdf library
+from functools import lru_cache
 
 
 def get_params():
@@ -25,6 +26,22 @@ def get_params():
 
     return params
 
+@lru_cache(maxsize=None)
+def set_secrets():
+    """
+    Function to set the secrets.
+    It loads the parameters from the .env file and sets them as env vars.
+    """
+    params = get_params()
+
+    secrets_path = os.path.join(params['conf_dir'], params['secrets_file'])
+
+    if os.path.exists(secrets_path):
+        from dotenv import load_dotenv
+        _ = load_dotenv(secrets_path)
+    else:
+        print(f'The secret file {secrets_path} does not exist!')
+
 
 def load_embedding_model(model_name: str = "sentence-transformers/all-mpnet-base-v2", model_kwargs: dict={}, encode_kwargs: dict={}):
     """Load a pretrained text embedding model"""