Added streaming

- app.py +91 -74
- climateqa/chains.py +9 -5
- climateqa/custom_retrieval_chain.py +63 -0
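The commit replaces the old blocking call with a producer/consumer streaming pattern: a worker thread runs the chain, the LLM callback pushes tokens onto a queue, and the Gradio handler drains the queue and yields partial answers until a sentinel arrives. A minimal, self-contained sketch of that pattern (illustrative names only, not code from this repo):

from queue import SimpleQueue
from threading import Thread

Q = SimpleQueue()
job_done = object()  # sentinel: the producer is finished

def produce(text):
    # Stand-in for the streaming LLM callback: push tokens, then the sentinel.
    for token in text.split():
        Q.put(token + " ")
    Q.put(job_done)

def stream(text):
    # Consumer generator: start the producer, then drain the queue until the sentinel.
    Thread(target=produce, args=(text,)).start()
    answer = ""
    while True:
        item = Q.get(block=True)
        if item is job_done:
            break
        answer += item
        yield answer

for partial in stream("tokens streamed through a queue"):
    print(partial)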
app.py CHANGED

@@ -68,89 +68,77 @@ from langchain.callbacks.base import BaseCallbackHandler
 from queue import Queue, Empty
 from threading import Thread
 from collections.abc import Generator
+from langchain.schema import LLMResult
+from typing import Any, Union,Dict,List
+from queue import SimpleQueue
 
-# Create a Queue
-Q = Queue()
+# # Create a Queue
+# Q = Queue()
 
-class QueueCallback(BaseCallbackHandler):
-    """Callback handler for streaming LLM responses to a queue."""
-
-    def
+Q = SimpleQueue()
+job_done = object() # signals the processing is done
+
+class StreamingGradioCallbackHandler(BaseCallbackHandler):
+    def __init__(self, q: SimpleQueue):
         self.q = q
 
-    def
+    def on_llm_start(
+        self, serialized: Dict[str, Any], prompts: List[str], **kwargs: Any
+    ) -> None:
+        """Run when LLM starts running. Clean the queue."""
+        while not self.q.empty():
+            try:
+                self.q.get(block=False)
+            except Empty:
+                continue
+
+    def on_llm_new_token(self, token: str, **kwargs: Any) -> None:
+        """Run on new LLM token. Only available when streaming is enabled."""
         self.q.put(token)
 
-    def on_llm_end(self,
-
-
+    def on_llm_end(self, response: LLMResult, **kwargs: Any) -> None:
+        """Run when LLM ends running."""
+        self.q.put(job_done)
+
+    def on_llm_error(
+        self, error: Union[Exception, KeyboardInterrupt], **kwargs: Any
+    ) -> None:
+        """Run when LLM errors."""
+        self.q.put(job_done)
+
 
 # Create embeddings function and LLM
 embeddings_function = HuggingFaceEmbeddings(model_name = "sentence-transformers/multi-qa-mpnet-base-dot-v1")
-
-
+llm_reformulation = get_llm(max_tokens = 512,temperature = 0.0,verbose = True,streaming = False)
+llm_streaming = get_llm(max_tokens = 1024,temperature = 0.0,verbose = True,streaming = True,
+    callbacks=[StreamingGradioCallbackHandler(Q),StreamingStdOutCallbackHandler()],
 )
 
 # Create vectorstore and retriever
 vectorstore = get_pinecone_vectorstore(embeddings_function)
 retriever = ClimateQARetriever(vectorstore=vectorstore,sources = ["IPCC"],k_summary = 3,k_total = 10)
-chain = load_climateqa_chain(retriever,
+chain = load_climateqa_chain(retriever,llm_reformulation,llm_streaming)
 
 #---------------------------------------------------------------------------
 # ClimateQ&A Streaming
 # From https://github.com/gradio-app/gradio/issues/5345
+# And https://stackoverflow.com/questions/76057076/how-to-stream-agents-response-in-langchain
 #---------------------------------------------------------------------------
 
-
-
-
-
-    Q.queue.clear()
-    job_done = object()
-
-    # Create a function to call - this will run in a thread
-    def task():
-        answer = chain({"query":input_text,"audience":"expert climate scientist"})
-        Q.put(job_done)
-
-    # Create a thread and start the function
-    t = Thread(target=task)
-    t.start()
-
-    content = ""
-
-    # Get each new token from the queue and yield for our generator
-    while True:
-        try:
-            next_token = Q.get(True, timeout=1)
-            if next_token is job_done:
-                break
-            content += next_token
-            yield next_token, content
-        except Empty:
-            continue
-
-
-def stream_sentences(chain, input_text) -> Generator:
-    """wrapper to stream function"""
-    sentence = ""
-    for next_token, content in stream(chain, input_text):
-        sentence += next_token
-        if "\n\n" in next_token:
-            yield sentence
-            sentence = ""
-    if sentence:
-        yield sentence
-
-
+from threading import Thread
+
+def threaded_chain(query,audience):
+    response = chain({"query":query,"audience":audience})
+    Q.put(response)
+    Q.put(job_done)
 
 def answer_user(message,history):
     return message, history + [[message, None]]
 
-
 def answer_bot(message,history,audience):
 
     if audience == "Children":
@@ -170,25 +158,39 @@ def answer_bot(message,history,audience):
     # for next_token, content in stream(message):
     # yield(content)
 
-
-
-    sources = output["source_documents"]
-
-    if len(sources) > 0:
-        sources_text = []
-        for i, d in enumerate(sources, 1):
-            sources_text.append(make_html_source(d,i))
-        sources_text = "\n\n".join([f"Query used for retrieval:\n{question}"] + sources_text)
-
-
-
-
-        complete_response = "**⚠️ No relevant passages found in the climate science reports (IPCC and IPBES), you may want to ask a more specific question (specifying your question on climate issues).**"
-        history[-1][1] = complete_response
-    return "",history, sources_text
+    thread = Thread(target=threaded_chain, kwargs={"query":message,"audience":audience_prompt})
+    thread.start()
+
+    history[-1][1] = ""
+    while True:
+        next_item = Q.get(block=True) # Blocks until an input is available
+
+        if next_item is job_done:
+            continue
+
+        elif isinstance(next_item, dict): # assuming LLMResult is a dictionary
+            response = next_item
+            if "source_documents" in response and len(response["source_documents"]) > 0:
+                sources_text = []
+                for i, d in enumerate(response["source_documents"], 1):
+                    sources_text.append(make_html_source(d, i))
+                sources_text = "\n\n".join([f"Query used for retrieval:\n{response['question']}"] + sources_text)
+                # history[-1][1] += next_item["answer"]
+                # history[-1][1] += "\n\n" + sources_text
+                yield "", history, sources_text
+
+            else:
+                sources_text = "⚠️ No relevant passages found in the scientific reports (IPCC and IPBES)"
+                complete_response = "**⚠️ No relevant passages found in the climate science reports (IPCC and IPBES), you may want to ask a more specific question (specifying your question on climate and biodiversity issues).**"
+                history[-1][1] += "\n\n" + complete_response
+                yield "", history, sources_text
+            break
+
+        elif isinstance(next_item, str):
+            history[-1][1] += next_item
+            yield "", history, ""
+
+    thread.join()
 
 #---------------------------------------------------------------------------
 # ClimateQ&A core functions
@@ -348,7 +350,19 @@ def log_on_azure(file, logs, share_client):
 # --------------------------------------------------------------------
 
 
+init_prompt = """
+Hello ! I am ClimateQ&A, a conversational assistant designed to help you understand climate change and biodiversity loss. I will answer your questions by **sifting through the IPCC and IPBES scientific reports**.
+
+💡 How to use
+- **Language**: You can ask me your questions in any language.
+- **Audience**: You can specify your audience (children, general public, experts) to get a more adapted answer.
+- **Sources**: You can choose to search in the IPCC or IPBES reports, or both.
+
+📚 Limitations
+*Please note that the AI is not perfect and may sometimes give irrelevant answers. If you are not satisfied with the answer, please ask a more specific question or report your feedback to help us improve the system.*
+
+❓ What do you want to learn ?
+"""
 
 
 with gr.Blocks(title="🌍 Climate Q&A", css="style.css", theme=theme) as demo:
@@ -363,7 +377,9 @@ with gr.Blocks(title="🌍 Climate Q&A", css="style.css", theme=theme) as demo:
     with gr.Row(elem_id="chatbot-row"):
         with gr.Column(scale=2):
             # state = gr.State([system_template])
-            bot = gr.Chatbot(
+            bot = gr.Chatbot(
+                value=[[None,init_prompt]],
+                show_copy_button=True,show_label = False,elem_id="chatbot",layout = "panel",avatar_images = ("assets/logo4.png",None))
 
         with gr.Row(elem_id = "input-message"):
             textbox=gr.Textbox(placeholder="Ask me anything here!",show_label=False,scale=7)
@@ -441,7 +457,6 @@ with gr.Blocks(title="🌍 Climate Q&A", css="style.css", theme=theme) as demo:
     examples_hidden.change(answer_user, [examples_hidden, bot], [textbox, bot], queue=False).then(
         answer_bot, [textbox,bot,dropdown_audience], [textbox,bot,sources_textbox]
     )
-
    submit_button.click(answer_user, [textbox, bot], [textbox, bot], queue=False).then(
         answer_bot, [textbox,bot,dropdown_audience], [textbox,bot,sources_textbox]
     )
@@ -619,6 +634,8 @@ Or around 2 to 4 times more than a typical Google search.
 - ClimateQ&A on Hugging Face is finally working again with all the new features !
 - Switched all python code to langchain codebase for cleaner code, easier maintenance and future features
 - Updated GPT model to August version
+- Added streaming response to improve UX
+- Created a custom Retriever chain to avoid calling the LLM if there is no documents retrieved
 - Use of HuggingFace embed on https://climateqa.com to avoid demultiplying deployments
 
 ##### v1.0.0 - *2023-05-11*
climateqa/chains.py CHANGED

@@ -8,7 +8,7 @@ from langchain.chains import TransformChain, SequentialChain
 from langchain.chains.qa_with_sources import load_qa_with_sources_chain
 
 from climateqa.prompts import answer_prompt, reformulation_prompt,audience_prompts
-
+from climateqa.custom_retrieval_chain import CustomRetrievalQAWithSourcesChain
 
 def load_reformulation_chain(llm):
 
@@ -38,6 +38,7 @@ def load_reformulation_chain(llm):
 
 
 
+
 def load_answer_chain(retriever,llm):
     prompt = PromptTemplate(template=answer_prompt, input_variables=["summaries", "question","audience","language"])
     qa_chain = load_qa_with_sources_chain(llm, chain_type="stuff",prompt = prompt)
@@ -45,24 +46,27 @@ def load_answer_chain(retriever,llm):
     # This could be improved by providing a document prompt to avoid modifying page_content in the docs
     # See here https://github.com/langchain-ai/langchain/issues/3523
 
-    answer_chain =
+    answer_chain = CustomRetrievalQAWithSourcesChain(
         combine_documents_chain = qa_chain,
         retriever=retriever,
         return_source_documents = True,
+        verbose = True,
+        fallback_answer="**⚠️ No relevant passages found in the climate science reports (IPCC and IPBES), you may want to ask a more specific question (specifying your question on climate issues).**",
     )
     return answer_chain
 
 
-def load_climateqa_chain(retriever,
+def load_climateqa_chain(retriever,llm_reformulation,llm_answer):
 
-    reformulation_chain = load_reformulation_chain(
-    answer_chain = load_answer_chain(retriever,
+    reformulation_chain = load_reformulation_chain(llm_reformulation)
+    answer_chain = load_answer_chain(retriever,llm_answer)
 
     climateqa_chain = SequentialChain(
         chains = [reformulation_chain,answer_chain],
         input_variables=["query","audience"],
         output_variables=["answer","question","language","source_documents"],
         return_all = True,
+        verbose = True,
     )
     return climateqa_chain
climateqa/custom_retrieval_chain.py ADDED

@@ -0,0 +1,63 @@
+from __future__ import annotations
+import inspect
+from typing import Any, Dict, List, Optional
+
+from pydantic import Extra
+
+from langchain.schema.language_model import BaseLanguageModel
+from langchain.callbacks.manager import (
+    AsyncCallbackManagerForChainRun,
+    CallbackManagerForChainRun,
+)
+from langchain.chains.base import Chain
+from langchain.prompts.base import BasePromptTemplate
+
+from typing import Any, Dict, List
+
+from langchain.callbacks.manager import (
+    AsyncCallbackManagerForChainRun,
+    CallbackManagerForChainRun,
+)
+from langchain.chains.combine_documents.stuff import StuffDocumentsChain
+from langchain.chains.qa_with_sources.base import BaseQAWithSourcesChain
+from langchain.docstore.document import Document
+from langchain.pydantic_v1 import Field
+from langchain.schema import BaseRetriever
+
+from langchain.chains import RetrievalQAWithSourcesChain
+
+
+from langchain.chains.router.llm_router import LLMRouterChain
+
+class CustomRetrievalQAWithSourcesChain(RetrievalQAWithSourcesChain):
+
+    fallback_answer:str = "No sources available to answer this question."
+
+    def _call(self,inputs,run_manager=None):
+        _run_manager = run_manager or CallbackManagerForChainRun.get_noop_manager()
+        accepts_run_manager = (
+            "run_manager" in inspect.signature(self._get_docs).parameters
+        )
+        if accepts_run_manager:
+            docs = self._get_docs(inputs, run_manager=_run_manager)
+        else:
+            docs = self._get_docs(inputs)  # type: ignore[call-arg]
+
+
+        if len(docs) == 0:
+            answer = self.fallback_answer
+            sources = []
+        else:
+
+            answer = self.combine_documents_chain.run(
+                input_documents=docs, callbacks=_run_manager.get_child(), **inputs
+            )
+            answer, sources = self._split_sources(answer)
+
+        result: Dict[str, Any] = {
+            self.answer_key: answer,
+            self.sources_answer_key: sources,
+        }
+        if self.return_source_documents:
+            result["source_documents"] = docs
+        return result