"""Wrapper around HuggingFace Pipeline APIs.""" | |
import importlib.util | |
import logging | |
from typing import Any, List, Mapping, Optional | |
from pydantic import BaseModel, Extra | |
from langchain.llms.base import LLM | |
from langchain.llms.utils import enforce_stop_tokens | |
DEFAULT_MODEL_ID = "gpt2" | |
DEFAULT_TASK = "text-generation" | |
VALID_TASKS = ("text2text-generation", "text-generation") | |
logger = logging.getLogger() | |
class HuggingFacePipeline(LLM, BaseModel): | |
"""Wrapper around HuggingFace Pipeline API. | |
To use, you should have the ``transformers`` python package installed. | |
Only supports `text-generation` and `text2text-generation` for now. | |
Example using from_model_id: | |
.. code-block:: python | |
from langchain.llms import HuggingFacePipeline | |
hf = HuggingFacePipeline.from_model_id( | |
model_id="gpt2", task="text-generation" | |
) | |
Example passing pipeline in directly: | |
.. code-block:: python | |
from langchain.llms import HuggingFacePipeline | |
from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline | |
model_id = "gpt2" | |
tokenizer = AutoTokenizer.from_pretrained(model_id) | |
model = AutoModelForCausalLM.from_pretrained(model_id) | |
pipe = pipeline( | |
"text-generation", model=model, tokenizer=tokenizer, max_new_tokens=10 | |
) | |
hf = HuggingFacePipeline(pipeline=pipe) | |
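
    Example calling the wrapped model (a minimal usage sketch; the prompt
    below is illustrative only):
        .. code-block:: python

            hf = HuggingFacePipeline.from_model_id(
                model_id="gpt2", task="text-generation"
            )
            generated = hf("Once upon a time")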
""" | |
pipeline: Any #: :meta private: | |
model_id: str = DEFAULT_MODEL_ID | |
"""Model name to use.""" | |
model_kwargs: Optional[dict] = None | |
"""Key word arguments to pass to the model.""" | |
class Config: | |
"""Configuration for this pydantic object.""" | |
extra = Extra.forbid | |
    @classmethod
    def from_model_id(
        cls,
        model_id: str,
        task: str,
        device: int = -1,
        model_kwargs: Optional[dict] = None,
        **kwargs: Any,
    ) -> LLM:
"""Construct the pipeline object from model_id and task.""" | |
try: | |
from transformers import ( | |
AutoModelForCausalLM, | |
AutoModelForSeq2SeqLM, | |
AutoTokenizer, | |
) | |
from transformers import pipeline as hf_pipeline | |
except ImportError: | |
raise ValueError( | |
"Could not import transformers python package. " | |
"Please it install it with `pip install transformers`." | |
) | |
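        # Load the tokenizer and a task-appropriate model head; any
        # model_kwargs are forwarded to the ``from_pretrained`` calls.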
        _model_kwargs = model_kwargs or {}
        tokenizer = AutoTokenizer.from_pretrained(model_id, **_model_kwargs)

        try:
            if task == "text-generation":
                model = AutoModelForCausalLM.from_pretrained(model_id, **_model_kwargs)
            elif task == "text2text-generation":
                model = AutoModelForSeq2SeqLM.from_pretrained(model_id, **_model_kwargs)
            else:
                raise ValueError(
                    f"Got invalid task {task}, "
                    f"currently only {VALID_TASKS} are supported"
                )
        except ImportError as e:
            raise ValueError(
                f"Could not load the {task} model due to missing dependencies."
            ) from e
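        # Device semantics follow ``transformers.pipeline``: -1 (the default)
        # runs on CPU, while 0..N-1 selects the corresponding CUDA device.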
        if importlib.util.find_spec("torch") is not None:
            import torch

            cuda_device_count = torch.cuda.device_count()
            if device < -1 or (device >= cuda_device_count):
                raise ValueError(
                    f"Got device=={device}, "
                    f"device is required to be within [-1, {cuda_device_count})"
                )
            if device < 0 and cuda_device_count > 0:
                logger.warning(
                    "Device has %d GPUs available. "
                    "Provide device={deviceId} to `from_model_id` to use available "
                    "GPUs for execution. deviceId is -1 (default) for CPU and "
                    "can be a positive integer associated with CUDA device id.",
                    cuda_device_count,
                )
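        # Assemble the transformers pipeline and re-validate the task it
        # reports, since the resolved task is what ``_call`` dispatches on.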
        pipeline = hf_pipeline(
            task=task,
            model=model,
            tokenizer=tokenizer,
            device=device,
            model_kwargs=_model_kwargs,
        )
        if pipeline.task not in VALID_TASKS:
            raise ValueError(
                f"Got invalid task {pipeline.task}, "
                f"currently only {VALID_TASKS} are supported"
            )
        return cls(
            pipeline=pipeline,
            model_id=model_id,
            model_kwargs=_model_kwargs,
            **kwargs,
        )
    @property
    def _identifying_params(self) -> Mapping[str, Any]:
        """Get the identifying parameters."""
        return {
            **{"model_id": self.model_id},
            **{"model_kwargs": self.model_kwargs},
        }
    @property
    def _llm_type(self) -> str:
        return "huggingface_pipeline"
    def _call(self, prompt: str, stop: Optional[List[str]] = None) -> str:
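        """Run the pipeline on the prompt and return the generated text."""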
        response = self.pipeline(prompt)
        if self.pipeline.task == "text-generation":
            # Text generation return includes the starter text.
            text = response[0]["generated_text"][len(prompt) :]
        elif self.pipeline.task == "text2text-generation":
            text = response[0]["generated_text"]
        else:
            raise ValueError(
                f"Got invalid task {self.pipeline.task}, "
                f"currently only {VALID_TASKS} are supported"
            )
        if stop is not None:
            # This is a bit hacky, but I can't figure out a better way to enforce
            # stop tokens on the pipeline output.
            text = enforce_stop_tokens(text, stop)
        return text