lavague / app.py
Daniel Huynh
feat: woorking demo
8042b49
raw
history blame
6.49 kB
import gradio as gr
from lavague.ActionEngine import ActionEngine
from lavague.defaults import DefaultLocalLLM, DefaultLLM
from llama_index.llms.huggingface import HuggingFaceInferenceAPI
import base64
import requests
import uuid
import re
MAX_CHARS = 1500
USER_ID = str(uuid.uuid4())
SERVER_URL = "https://lavague.mithrilsecurity.io"
# Use this action_engine instead to have a local inference
# action_engine = ActionEngine(llm=DefaultLocalLLM())
action_engine = ActionEngine()
title = """
<div align="center">
<h1>🌊 Welcome to LaVague</h1>
<p>Redefining internet surfing by transforming natural language instructions into seamless browser interactions.</p>
</div>
"""
# action_engine = ActionEngine(llm, embedder)
def exec_code_req(url, code):
headers = {
"X-User-ID": USER_ID # Include the X-User-ID header for authentication
}
try:
response = requests.post(SERVER_URL + "/execute_req", json={"url": url, "requests": code}, headers=headers)
if response.status_code == 200:
return response.json()
else:
return {"error": f"Failed with status code {response.status_code}"}
except requests.RequestException as e:
return {"error": str(e)}
def get_html(url):
headers = {
"X-User-ID": USER_ID # Include the X-User-ID header for authentication
}
try:
response = requests.post(SERVER_URL + "/get_html", json={"url": url}, headers=headers)
if response.status_code == 200:
return response.json()
else:
return {"error": f"Failed with status code {response.status_code}"}
except requests.RequestException as e:
return {"error": str(e)}
def send_request(url):
headers = {
"X-User-ID": USER_ID # Include the X-User-ID header for authentication
}
try:
response = requests.get(SERVER_URL + "/screenshot", params={"url": url}, headers=headers)
if response.status_code == 200:
return response.json()
else:
return {"error": f"Failed with status code {response.status_code}"}
except requests.RequestException as e:
return {"error": str(e)}
def process_url(url):
r = send_request(url)
f = open("screenshot.png", "wb")
scr = base64.b64decode(r["result"])
f.write(scr)
return "screenshot.png"
def process_instruction(query, url_input):
r = get_html(url_input)
state = r["html"]
query_engine = action_engine.get_query_engine(state)
response = query_engine.query(query)
source_nodes = response.get_formatted_sources(MAX_CHARS)
return response.response, source_nodes
def extract_first_python_code(markdown_text):
# Pattern to match the first ```python ``` code block
pattern = r"```python(.*?)```"
# Using re.DOTALL to make '.' match also newlines
match = re.search(pattern, markdown_text, re.DOTALL)
if match:
# Return the first matched group, which is the code inside the ```python ```
return match.group(1).strip()
else:
# Return None if no match is found
return None
def exec_code(code, source_nodes, full_code, url):
code = extract_first_python_code(code)
html = ""
try:
r = exec_code_req(url, code)
url = r["url"]
html = r["html"]
output = "Successful code execution"
status = """<p style="color: green; font-size: 20px; font-weight: bold;">Success!</p>"""
full_code += code
except Exception as e:
output = f"Error in code execution: {str(e)}"
status = """<p style="color: red; font-size: 20px; font-weight: bold;">Failure! Open the Debug tab for more information</p>"""
return output, code, html, status, full_code, url
def update_image_display(img, url):
r = send_request(url)
f = open("screenshot.png", "wb")
scr = base64.b64decode(r["result"])
f.write(scr)
return "screenshot.png", url
def show_processing_message():
return "Processing..."
def create_demo(base_url, instructions):
with gr.Blocks() as demo:
with gr.Tab("LaVague"):
with gr.Row():
gr.HTML(title)
with gr.Row():
url_input = gr.Textbox(value=base_url, label="Enter URL and press 'Enter' to load the page.")
with gr.Row():
with gr.Column(scale=7):
image_display = gr.Image(label="Browser", interactive=False)
with gr.Column(scale=3):
with gr.Accordion(label="Full code", open=False):
full_code = gr.Code(value="", language="python", interactive=False)
code_display = gr.Code(label="Generated code", language="python",
lines=5, interactive=True)
status_html = gr.HTML()
with gr.Row():
with gr.Column(scale=8):
text_area = gr.Textbox(label="Enter instructions and press 'Enter' to generate code.")
gr.Examples(examples=instructions, inputs=text_area)
with gr.Tab("Debug"):
with gr.Row():
with gr.Column():
log_display = gr.Textbox(interactive=False, lines=20)
with gr.Column():
source_display = gr.Code(language="html", label="Retrieved nodes", interactive=False, lines=20)
with gr.Row():
with gr.Accordion(label="Full HTML", open=False):
full_html = gr.Code(language="html", label="Full HTML", interactive=False, lines=20)
# Linking components
url_input.submit(process_url, inputs=url_input, outputs=image_display)
text_area.submit(show_processing_message, outputs=[status_html]).then(
process_instruction, inputs=[text_area, url_input], outputs=[code_display, source_display]
).then(
exec_code, inputs=[code_display, source_display, full_code, url_input],
outputs=[log_display, code_display, full_html, status_html, full_code, url_input]
).then(
update_image_display, inputs=[image_display, url_input], outputs=[image_display, url_input]
)
demo.launch(share=True, debug=True)
base_url = "https://huggingface.co/"
instructions = ["Click on the Datasets item on the menu, between Models and Spaces",
"Click on the search bar 'Filter by name', type 'The Stack', and press 'Enter'",
"Scroll by 500 pixels",]
create_demo(base_url, instructions)