splitted into files

aditya30051993 · Sep 17, 2024 · fa42415 · fa42415
1 parent eb2d520
commit fa42415
Show file tree

Hide file tree

Showing 9 changed files with 224 additions and 273 deletions.
diff --git a/app/api/pdf.py b/app/api/pdf.py
diff --git a/app/api/routes.py b/app/api/routes.py
@@ -0,0 +1,35 @@
+from fastapi import APIRouter, UploadFile, File
+from app.utils.html_processing import upload_html
+from app.utils.pdf_processing import process_pdf
+from app.core.ollama_manager import qa_chain
+from app.core.selenium_driver import driver, apply_action_on_driver
+import json
+
+router = APIRouter()
+
+@router.post("/upload_pdf/")
+async def upload_pdf(file: UploadFile = File(...)):
+    return await process_pdf(file)
+
+@router.get("/search_pdf/")
+async def search(query: str):
+    result = qa_chain.invoke({"query": query})
+    return result
+
+@router.get("/assistant/")
+async def assistant(query: str):
+    html = driver.page_source
+    url = driver.current_url
+    upload_html(html, url)
+
+    result = qa_chain.invoke({"query": query})
+    action_response = {}
+
+    try:
+        action_response = json.loads(result.get("result"))
+    except:
+        pass
+
+    apply_action_on_driver(action_response)
+
+    return result
diff --git a/app/core/milvus_manager.py b/app/core/milvus_manager.py
@@ -0,0 +1,13 @@
+from langchain_huggingface import HuggingFaceEmbeddings
+from langchain_community.vectorstores import Milvus
+
+embedding_function = HuggingFaceEmbeddings(
+    model_name="all-MiniLM-L6-v2", 
+    show_progress=True
+)
+
+vector_store = Milvus(
+    embedding_function=embedding_function,
+    collection_name="_browser_session",
+    auto_id=True,
+)
diff --git a/app/core/ollama_manager.py b/app/core/ollama_manager.py
@@ -0,0 +1,51 @@
+from langchain_community.llms import Ollama
+from langchain.callbacks.manager import CallbackManager
+from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
+from langchain.chains import RetrievalQA
+from app.core.milvus_manager import vector_store
+from langchain.prompts.chat import ChatPromptTemplate
+
+llm = Ollama(
+    model="llama3.1",
+    callback_manager=CallbackManager([StreamingStdOutCallbackHandler()]),
+    stop=["<|eot_id|>"],
+    base_url="http://192.168.6.201:9000",
+)
+
+prompt_template = """
+You are a Selenium browser assistant. You will receive a page URL, a parent XPATH, and text to work with. Additionally, you will be given a user query. Only from the context DOM, provide instructions to the Selenium driver for navigating, scrolling, clicking, or inputting if they are intended by the query. You must always provide the response with a summary of the information extracted based on the query or respond with how these actions can result in the requested information.
+
+Return the result strictly in JSON format:
+{{
+  "action": [],
+  "response": ""
+}}
+
+If nothing relevant is found in the context DOM and no specific URL is intended to be visited from the query, respond with: action with visit with search_query, query made to search on Google with the intent to find relevant information:
+{{
+  "action": [
+    {{
+      "type": "visit",
+      "url": "{{search_query}}"
+    }}
+  ],
+  "response": "No relevant information found. Consider searching on Google with the query: {{search_query}}."
+}}
+
+Ensure that this schema is strictly followed:
+- Actions should only come from the CONTEXT DOM.
+- Actions should only be for clicking or inputting.
+- If a specific URL is provided in the query, visit that URL.
+- If no specific URL is provided and nothing relevant is found in the CONTEXT DOM, only then share a action to visit for {{search_query}}.
+
+Question: {question} 
+Context: {context}
+"""
+
+chat_prompt = ChatPromptTemplate([("system", prompt_template)])
+
+qa_chain = RetrievalQA.from_chain_type(
+    llm,
+    retriever=vector_store.as_retriever(),
+    chain_type_kwargs={"prompt": chat_prompt},
+)