Spaces:

srush
/

minichain

Running

minichain / gatsby.py

srush HF staff

Upload with huggingface_hub

7b856a8 almost 2 years ago

1.5 kB

	# Questions answering with Hugging Face embeddings. Adapted from the
	# [LlamaIndex
	# example](https://github.com/jerryjliu/gpt_index/blob/main/examples/gatsby/TestGatsby.ipynb).

	import datasets
	import numpy as np

	from minichain import EmbeddingPrompt, TemplatePrompt, show_log, start_chain

	# Load data with embeddings (computed beforehand)

	gatsby = datasets.load_from_disk("gatsby")
	gatsby.add_faiss_index("embeddings")

	# Fast KNN retieval prompt

	class KNNPrompt(EmbeddingPrompt):
	def prompt(self, inp):
	return inp["query"]

	def find(self, out, inp):
	res = gatsby.get_nearest_examples("embeddings", np.array(out), 1)
	return {"question": inp["query"], "docs": res.examples["passages"]}

	# QA prompt to ask question with examples


	class QAPrompt(TemplatePrompt):
	template_file = "gatsby.pmpt.tpl"


	with start_chain("gatsby") as backend:
	# question = "What did Gatsby do before he met Daisy?"
	prompt = KNNPrompt(
	backend.HuggingFaceEmbed("sentence-transformers/all-mpnet-base-v2")
	).chain(QAPrompt(backend.OpenAI()))
	# result = prompt(question)
	# print(result)


	gradio = prompt.to_gradio(fields=["query"],
	examples=["What did Gatsby do before he met Daisy?"],
	keys={"HF_KEY"})
	if __name__ == "__main__":
	gradio.launch()



	# + tags=["hide_inp"]
	# QAPrompt().show({"question": "Who was Gatsby?", "docs": ["doc1", "doc2", "doc3"]}, "")
	# # -

	# show_log("gatsby.log")