-
Notifications
You must be signed in to change notification settings - Fork 2.6k
Expand file tree
/
Copy pathbrowser.py
More file actions
89 lines (69 loc) · 2.96 KB
/
browser.py
File metadata and controls
89 lines (69 loc) · 2.96 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
import asyncio
import base64
import os
from playwright.sync_api import sync_playwright, TimeoutError, Page
from playwright.async_api import async_playwright, TimeoutError
from markdownify import markdownify as md
from pdfminer.high_level import extract_text
from src.socket_instance import emit_agent
from src.config import Config
from src.state import AgentState
class Browser:
    """Thin asynchronous wrapper around a single headless Chromium page.

    Typical usage::

        browser = await Browser().start()
        await browser.go_to(url)
        text = await browser.extract_text()
        await browser.close()

    Every method that talks to the page is a coroutine and must be awaited,
    because the page is created through Playwright's async API.
    """

    def __init__(self):
        # Populated by start(); they stay None until then and are reset to
        # None again by close().
        self.playwright = None
        self.browser = None
        self.page = None
        self.agent = AgentState()

    async def start(self):
        """Start Playwright, launch headless Chromium and open one page.

        Returns:
            This instance, so the call can be chained:
            ``browser = await Browser().start()``.
        """
        self.playwright = await async_playwright().start()
        try:
            self.browser = await self.playwright.chromium.launch(headless=True)
            self.page = await self.browser.new_page()
        except Exception:
            # Do not leave the Playwright driver running when the launch
            # fails half-way; release what was acquired, then propagate.
            await self.close()
            raise
        return self

    async def go_to(self, url):
        """Navigate the page to *url*, waiting at most 20 seconds.

        Returns:
            True when navigation finished, False when it timed out. Other
            navigation errors propagate to the caller.
        """
        try:
            await self.page.goto(url, timeout=20000)
        except TimeoutError as e:
            print(f"TimeoutError: {e} when trying to navigate to {url}")
            return False
        return True

    async def screenshot(self, project_name):
        """Capture the current page and record it in the agent state.

        A full-page PNG is written to the configured screenshots directory
        under a random file name, and a second screenshot with Playwright's
        default options is taken and base64-encoded for the return value.

        Args:
            project_name: Project whose agent state receives the new entry.

        Returns:
            A ``(path_to_save, screenshot_b64)`` tuple: the path of the PNG
            on disk and the base64 text of the second screenshot.
        """
        screenshots_save_path = Config().get_screenshots_dir()

        page_metadata = await self.page.evaluate(
            "() => { return { url: document.location.href, title: document.title } }"
        )
        page_url = page_metadata['url']

        # Random name so screenshots of different pages never collide.
        random_filename = os.urandom(20).hex()
        filename_to_save = f"{random_filename}.png"
        path_to_save = os.path.join(screenshots_save_path, filename_to_save)

        await self.page.emulate_media(media="screen")
        await self.page.screenshot(path=path_to_save, full_page=True)
        screenshot = await self.page.screenshot()
        screenshot_bytes = base64.b64encode(screenshot).decode()

        new_state = self.agent.new_state()
        new_state["internal_monologue"] = "Browsing the web right now..."
        new_state["browser_session"]["url"] = page_url
        new_state["browser_session"]["screenshot"] = path_to_save
        self.agent.add_to_current_state(project_name, new_state)

        return path_to_save, screenshot_bytes

    async def get_html(self):
        """Return the full HTML of the current page."""
        return await self.page.content()

    async def get_markdown(self):
        """Return the current page's HTML converted to Markdown."""
        return md(await self.page.content())

    @staticmethod
    def _safe_filename(title):
        """Turn a page title into a file name without path separators."""
        # The title comes from an arbitrary web page: keep letters, digits and
        # a few harmless punctuation marks, replace everything else.
        cleaned = "".join(
            ch if ch.isalnum() or ch in " ._-" else "_" for ch in (title or "")
        )
        # Bound the length, then drop leading/trailing dots and spaces.
        cleaned = cleaned[:200].strip(" .")
        return cleaned or "untitled"

    async def get_pdf(self):
        """Render the current page to a PDF in the configured PDFs directory.

        The file is named after the page title, sanitised so that it cannot
        contain path separators; pages without a usable title are saved as
        ``untitled.pdf``.

        Returns:
            The path of the written PDF file.
        """
        pdfs_save_path = Config().get_pdfs_dir()

        page_metadata = await self.page.evaluate(
            "() => { return { url: document.location.href, title: document.title } }"
        )

        filename_to_save = f"{self._safe_filename(page_metadata['title'])}.pdf"
        save_path = os.path.join(pdfs_save_path, filename_to_save)

        await self.page.pdf(path=save_path)

        return save_path

    def pdf_to_text(self, pdf_path):
        """Return the text extracted from the PDF at *pdf_path*, stripped."""
        return extract_text(pdf_path).strip()

    async def get_content(self):
        """Return the page's text by rendering it to PDF and extracting it."""
        pdf_path = await self.get_pdf()
        return self.pdf_to_text(pdf_path)

    async def extract_text(self):
        """Return ``document.body.innerText`` of the current page."""
        return await self.page.evaluate("() => document.body.innerText")

    async def close(self):
        """Close the page and browser, then stop the Playwright driver.

        Safe to call when start() was never called, failed part-way, or when
        close() has already run: handles that are None are skipped, and all
        three attributes are reset to None.
        """
        page, browser, playwright = self.page, self.browser, self.playwright
        self.page = self.browser = self.playwright = None

        # Nested finally blocks: a failure while closing one handle must not
        # prevent the remaining ones from being released.
        try:
            if page is not None:
                await page.close()
        finally:
            try:
                if browser is not None:
                    await browser.close()
            finally:
                if playwright is not None:
                    await playwright.stop()