FeckNeck

Reputation: 198

LangChain RAG: mixing chat history and returning sources

I'm developing a small API using LangChain and FastAPI, and I'm having trouble combining chat history with returning the sources. I can't find an example in the documentation that mixes the two. I've seen that ConversationalRetrievalChain lets you return the sources and add memory, but I don't think it works with RAG and custom templates (see the sketch after my code below). Has anyone run into the same difficulties, and if so, have you found a solution?

from fastapi import FastAPI
from langchain.vectorstores import FAISS
from langchain.chat_models import ChatOpenAI
from langchain.embeddings import OpenAIEmbeddings
from langchain_core.prompts import ChatPromptTemplate
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnableParallel, RunnablePassthrough
import pandas as pd

model = ChatOpenAI(model_name="gpt-3.5-turbo", temperature=0.7)
embeddings = OpenAIEmbeddings()

vectorstore = FAISS.load_local("products_metadata", embeddings, allow_dangerous_deserialization=True)
retriever = vectorstore.as_retriever()

products = pd.read_json('./data/products.json', orient='records', lines=True)

def format_docs(docs):
    return "\n\n".join(doc.page_content for doc in docs)

app = FastAPI(
    title="LangChain Server",
    version="1.0",
    description="Spin up a simple api server using Langchain's Runnable interfaces",
)

ANSWER_TEMPLATE = """Answer the question with an introductory sentence and use the following contextual elements to answer the question. Format the context as follows: - product name, brand, country, with a line break between each product.
Context: {context}
Question: {question}
Answer: """

ANSWER_PROMPT = ChatPromptTemplate.from_template(ANSWER_TEMPLATE)

rag_chain_from_docs = (
    RunnablePassthrough.assign(context=(lambda x: format_docs(x["context"])))
    | ANSWER_PROMPT
    | model
    | StrOutputParser()
)

rag_chain_with_source = RunnableParallel(
    {"context": retriever, "question": RunnablePassthrough()}
).assign(answer=rag_chain_from_docs)

from pydantic import BaseModel
class Question(BaseModel):
    question: str

@app.post("/invoke")
def invoke_chain(question: Question):
    result = rag_chain_with_source.invoke(question.question)
    return result

@app.get("/products")
def get_products():
    return products.to_dict(orient='records')

@app.get("/products/{product_id}")
def get_product(product_id: int):
    product = products[products['code'] == product_id]
    return product.to_dict(orient='records')

if __name__ == "__main__":
    import uvicorn

    uvicorn.run(app, host="localhost", port=8000)
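
For reference, the ConversationalRetrievalChain approach I mentioned would look roughly like this (just a sketch reusing the model and retriever above, with a placeholder question; I still don't see how to fit my custom ANSWER_PROMPT into it):

from langchain.chains import ConversationalRetrievalChain
from langchain.memory import ConversationBufferMemory

# The memory needs an explicit output_key because the chain returns several keys
# when return_source_documents=True.
memory = ConversationBufferMemory(
    memory_key="chat_history",
    return_messages=True,
    output_key="answer",
)

conv_chain = ConversationalRetrievalChain.from_llm(
    llm=model,
    retriever=retriever,
    memory=memory,
    return_source_documents=True,
)

result = conv_chain.invoke({"question": "Which products do you have from France?"})  # placeholder question
# result["answer"] -> the generated answer
# result["source_documents"] -> the retrieved documents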

Upvotes: 1

Views: 376

Answers (1)

Nikster

Reputation: 474

I have run into the same issue as you, but I think I've found a solution that might help.

I have done it a little differently, as I am using AWS Bedrock and an AWS Bedrock Knowledge Base for my vector store.

It is also important to note that the initial prompt for your system should include the context variable to inject your retrieved data into. There was no need for me to include the question, as I pass it in when I actually invoke (stream) the model.

I will also include some blog posts and docs I read to get to this stage of my code, as I'm not 100% knowledgeable about LangChain and why this works.

initial_prompt = """ You are a helpful AI tool to answer questions {context} """

Example data for the messages variable:

[
  {
    'role': 'system',
    'content': 'You are a helpful AI tool to answer questions'
  },
  {
    'role': 'user',
    'content': 'Hello, how are you?'
  }
]
Helper functions

def get_retriever():
    return AmazonKnowledgeBasesRetriever(
        knowledge_base_id=awssettings.aws_knowledge_base_id,
        client=BEDROCK_AGENT_RUNTIME,
        retrieval_config={
            "vectorSearchConfiguration": {
                "numberOfResults": 3,
            },
        },
    )


def get_model(options=None):
    # Avoid a mutable default argument; fall back to the same defaults as before.
    if options is None:
        options = {
            "streaming": True,
            "model_kwargs": {},
            "callbacks": []
        }

    model_kwargs = {**MODEL_KWARGS, **options.get("model_kwargs", {})}

    return ChatBedrock(
        client=BEDROCK_RUNTIME,
        model_id=MODEL_ID,
        streaming=options.get("streaming", True),
        model_kwargs=model_kwargs,
        callbacks=options.get("callbacks", []),
    )

Next is an example of how I formatted my data so it can be used with ChatPromptTemplate:

    messages = [x.context for x in interactions]  # this data looks like the example above
    formatted_messages = [(item['role'] if item['role'] != 'user' else 'human', item['content']) for item in messages]
    chat_template = ChatPromptTemplate.from_messages(formatted_messages)
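
For instance, with the example messages above, formatted_messages comes out as a list of (role, content) tuples (my reading of the comprehension):

formatted_messages = [
    ("system", "You are a helpful AI tool to answer questions"),
    ("human", "Hello, how are you?"),
]
# In practice the system entry should be initial_prompt, so that the {context}
# placeholder becomes an input variable of the resulting ChatPromptTemplate.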

I then retrieve my model and retriever:

    model = get_model()
    retriever = get_retriever()

def filter_retriever_data(retriever_data, uri_criteria):
    def uri_meets_criteria(uri):
        return uri_criteria in uri

    filtered_context = [
        doc for doc in retriever_data['context']
        if uri_meets_criteria(doc.metadata['location']['s3Location']['uri'])
    ]
    retriever_data['context'] = filtered_context

    return retriever_data


def filter_retriever_data_wrapper(uri_criteria):
    def wrapper(retriever_data):
        return filter_retriever_data(retriever_data, uri_criteria)
    return wrapper

The functions above are just to filter the data that gets returned by the retriever based on the Document URI in S3.
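
To illustrate (a hypothetical example; the bucket and account prefixes are made up), the wrapper can be tried on a dict shaped like the retriever output:

from langchain_core.documents import Document

retriever_output = {
    "context": [
        Document(
            page_content="Product A details...",
            metadata={"location": {"s3Location": {"uri": "s3://kb-bucket/account-123/doc1.pdf"}}},
        ),
        Document(
            page_content="Product B details...",
            metadata={"location": {"s3Location": {"uri": "s3://kb-bucket/account-456/doc2.pdf"}}},
        ),
    ]
}

filtered = filter_retriever_data_wrapper("account-123")(retriever_output)
# filtered["context"] now only contains the document stored under account-123/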

To be completely honest, I have no idea how this next part works. It came from a combination of multiple blog posts and help from ChatGPT.

What I do know is that it runs the retrieval and the question passthrough in parallel, combines the results into one dict, and then uses that to prompt my model, or something along those lines.

    chain = (
        RunnableParallel({"context": retriever, "question": RunnablePassthrough()})
        .assign(filtered_context=filter_retriever_data_wrapper(account_uuid))
        .assign(response=chat_template | model | StrOutputParser())
        .pick(["response", "context"])
    )
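
Here is my rough trace of what flows through that chain when it is invoked with a question string (my understanding, not authoritative):

# 1. RunnableParallel fans the input out into a dict:
#        {"context": [Document, ...],    # retriever run on the question
#         "question": "<the question>"}  # RunnablePassthrough keeps the raw input
#
# 2. .assign(filtered_context=...) calls the wrapper with that dict and stores its
#    return value under "filtered_context" (the wrapper also filters the "context"
#    list in place, which is what keeps only the wanted S3 URIs).
#
# 3. .assign(response=chat_template | model | StrOutputParser()) feeds the whole
#    dict into the prompt, so the {context} placeholder in the system message is
#    filled, and stores the model's text output under "response".
#
# 4. .pick(["response", "context"]) keeps only the answer text and the retrieved
#    documents, which is what lets you return the sources alongside the answer.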

And then I stream the data back to my app:

    question = messages[-1].get('content', '')  # the last message in messages is the question the user asked the AI
    response = ""

    for chunk in chain.stream(question):
        if 'response' in chunk:
            streamed = chunk.get('response', None)

            if streamed is None:
                continue

            response += streamed
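
Since the chain picks both "response" and "context", the stream also yields the retrieved documents, so you can collect the sources next to the answer and return them to your app. A sketch of how I read it (following the streaming guide linked below):

    response = ""
    sources = []

    for chunk in chain.stream(question):
        # "context" arrives once with the retrieved Documents; "response" arrives in pieces.
        if "context" in chunk:
            sources = chunk["context"]
        if "response" in chunk:
            piece = chunk.get("response")
            if piece:
                response += piece

    # e.g. expose the S3 URIs of the sources alongside the final answer
    source_uris = [doc.metadata["location"]["s3Location"]["uri"] for doc in sources]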

REFS:

https://medium.com/@dminhk/knowledge-bases-for-amazon-bedrock-with-langchain-%EF%B8%8F-6cd489646a5c

https://python.langchain.com/v0.1/docs/use_cases/question_answering/streaming/

Upvotes: 0
