File size: 1,497 Bytes
7b856a8 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 |
# Questions answering with Hugging Face embeddings. Adapted from the
# [LlamaIndex
# example](https://github.com/jerryjliu/gpt_index/blob/main/examples/gatsby/TestGatsby.ipynb).
import datasets
import numpy as np
from minichain import EmbeddingPrompt, TemplatePrompt, show_log, start_chain
# Load data with embeddings (computed beforehand)
gatsby = datasets.load_from_disk("gatsby")
gatsby.add_faiss_index("embeddings")
# Fast KNN retieval prompt
class KNNPrompt(EmbeddingPrompt):
def prompt(self, inp):
return inp["query"]
def find(self, out, inp):
res = gatsby.get_nearest_examples("embeddings", np.array(out), 1)
return {"question": inp["query"], "docs": res.examples["passages"]}
# QA prompt to ask question with examples
class QAPrompt(TemplatePrompt):
template_file = "gatsby.pmpt.tpl"
with start_chain("gatsby") as backend:
# question = "What did Gatsby do before he met Daisy?"
prompt = KNNPrompt(
backend.HuggingFaceEmbed("sentence-transformers/all-mpnet-base-v2")
).chain(QAPrompt(backend.OpenAI()))
# result = prompt(question)
# print(result)
gradio = prompt.to_gradio(fields=["query"],
examples=["What did Gatsby do before he met Daisy?"],
keys={"HF_KEY"})
if __name__ == "__main__":
gradio.launch()
# + tags=["hide_inp"]
# QAPrompt().show({"question": "Who was Gatsby?", "docs": ["doc1", "doc2", "doc3"]}, "")
# # -
# show_log("gatsby.log")
|