Spaces:

kingabzpro
/

Real-Time-RAG

Running

App Files Community

Abid Ali Awan committed on Aug 31, 2024

Commit

dbc2cc3

1 Parent(s): c84dd0f

improve the text trigger function

Browse files

Files changed (1) hide show

app.py +14 -7

app.py CHANGED Viewed

@@ -1,11 +1,12 @@
 import os
 import gradio as gr
 from langchain_core.output_parsers import StrOutputParser
 from langchain_core.runnables import RunnablePassthrough
 from langchain_groq import ChatGroq
 from langchain_huggingface import HuggingFaceEmbeddings
-from langchain_chroma import Chroma
-from langchain_core.prompts import PromptTemplate
 # Load the API key from environment variables
 groq_api_key = os.getenv("Groq_API_Key")
@@ -14,8 +15,9 @@ groq_api_key = os.getenv("Groq_API_Key")
 llm = ChatGroq(model="llama-3.1-70b-versatile", api_key=groq_api_key)
 # Initialize the embedding model
-embed_model = HuggingFaceEmbeddings(model_name="mixedbread-ai/mxbai-embed-large-v1",
-                                    model_kwargs = {'device': 'cpu'})
 # Load the vector store from a local directory
 vectorstore = Chroma(
@@ -48,6 +50,7 @@ rag_chain = (
     | StrOutputParser()
 )
 # Define the function to stream the RAG memory
 def rag_memory_stream(text):
     partial_text = ""
@@ -56,6 +59,7 @@ def rag_memory_stream(text):
         # Yield the updated conversation history
         yield partial_text
 # Set up the Gradio interface
 title = "Real-time AI App with Groq API and LangChain"
 description = """
@@ -68,15 +72,18 @@ demo = gr.Interface(
     title=title,
     description=description,
     fn=rag_memory_stream,
-    inputs="text",
-    outputs="text",
     live=True,
     batch=True,
     max_batch_size=10000,
     concurrency_limit=12,
     allow_flagging="never",
     theme=gr.themes.Soft(),
-    trigger_mode="always_last",
 )
 # Launch the Gradio interface

 import os
 import gradio as gr
+from langchain_chroma import Chroma
 from langchain_core.output_parsers import StrOutputParser
+from langchain_core.prompts import PromptTemplate
 from langchain_core.runnables import RunnablePassthrough
 from langchain_groq import ChatGroq
 from langchain_huggingface import HuggingFaceEmbeddings
 # Load the API key from environment variables
 groq_api_key = os.getenv("Groq_API_Key")
 llm = ChatGroq(model="llama-3.1-70b-versatile", api_key=groq_api_key)
 # Initialize the embedding model
+embed_model = HuggingFaceEmbeddings(
+    model_name="mixedbread-ai/mxbai-embed-large-v1", model_kwargs={"device": "cpu"}
+)
 # Load the vector store from a local directory
 vectorstore = Chroma(
     | StrOutputParser()
 )
 # Define the function to stream the RAG memory
 def rag_memory_stream(text):
     partial_text = ""
         # Yield the updated conversation history
         yield partial_text
 # Set up the Gradio interface
 title = "Real-time AI App with Groq API and LangChain"
 description = """
     title=title,
     description=description,
     fn=rag_memory_stream,
+    inputs=gr.Textbox(
+        label="Enter your Star Wars question:",
+        trigger_mode="always_last",
+        default="Who is luke?",
+    ),
+    outputs=gr.Textbox(label="Awnser:", default="...", trigger_mode="auto"),
     live=True,
     batch=True,
     max_batch_size=10000,
     concurrency_limit=12,
     allow_flagging="never",
     theme=gr.themes.Soft(),
 )
 # Launch the Gradio interface