# Mirror of https://github.com/browser-use/browser-use (synced 2026-05-06 17:52:15 +02:00)
# 109 lines, 2.9 KiB, Python
import os
|
|
import sys
|
|
from pathlib import Path
|
|
|
|
from browser_use.agent.views import ActionResult
|
|
|
|
sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
|
|
import asyncio
|
|
import logging
|
|
|
|
from langchain_openai import ChatOpenAI
|
|
|
|
from browser_use import Agent, Controller
|
|
from browser_use.browser.browser import Browser, BrowserConfig
|
|
from browser_use.browser.context import BrowserContext
|
|
|
|
logger = logging.getLogger(__name__)

# The shared browser is created first: a visible (non-headless) window driven by
# the Chrome binary at the hard-coded macOS application path.
browser = Browser(
    config=BrowserConfig(headless=False, browser_binary_path='/Applications/Google Chrome.app/Contents/MacOS/Google Chrome')
)

# Controller on which the custom actions defined in this file are registered.
controller = Controller()
|
|
|
|
|
|
@controller.action(
    'Upload file to interactive element with file path ',
)
async def upload_file(index: int, path: str, browser: BrowserContext, available_file_paths: list[str]):
    """Set ``path`` as the input file of the upload element found at ``index``.

    Args:
        index: Index passed to ``browser.get_dom_element_by_index``.
        path: File to upload; must be listed in ``available_file_paths`` and exist on disk.
        browser: Browser context used to look up and locate the element.
        available_file_paths: Paths this action is allowed to upload.

    Returns:
        An ``ActionResult`` carrying a success message in ``extracted_content``,
        or an ``error`` message when the path is rejected, no upload element is
        found, or setting the input files raises.
    """
    # Reject paths that were not explicitly allowed, then paths that are missing on disk.
    if path not in available_file_paths:
        return ActionResult(error=f'File path {path} is not available')
    if not os.path.exists(path):
        return ActionResult(error=f'File {path} does not exist')

    element_node = await browser.get_dom_element_by_index(index)
    upload_node = element_node.get_file_upload_element()

    # Only try to locate a live element when the DOM lookup produced an upload node.
    upload_handle = None
    if upload_node is not None:
        upload_handle = await browser.get_locate_element(upload_node)

    # Both "no upload node" and "node could not be located" report the same error.
    if upload_handle is None:
        not_found = f'No file upload element found at index {index}'
        logger.info(not_found)
        return ActionResult(error=not_found)

    try:
        await upload_handle.set_input_files(path)
        uploaded = f'Successfully uploaded file to index {index}'
        logger.info(uploaded)
        return ActionResult(extracted_content=uploaded, include_in_memory=True)
    except Exception as exc:
        # Any failure is reported back through the result instead of propagating.
        failure = f'Failed to upload file to index {index}: {exc!s}'
        logger.info(failure)
        return ActionResult(error=failure)
|
|
|
|
|
|
@controller.action('Read the file content of a file given a path')
async def read_file(path: str, available_file_paths: list[str]):
    """Return the text content of an allowed file wrapped in an ``ActionResult``.

    Args:
        path: File to read; must be listed in ``available_file_paths``.
        available_file_paths: Paths this action is allowed to read.

    Returns:
        An ``ActionResult`` whose ``extracted_content`` is ``'File content: <text>'``
        on success, or whose ``error`` explains why the file could not be read
        (path not allowed, file missing, I/O failure, or undecodable content).
    """
    if path not in available_file_paths:
        return ActionResult(error=f'File path {path} is not available')

    # Report read failures through the result, matching how upload_file reports
    # a missing file, instead of letting the exception escape the action.
    try:
        with open(path, 'r') as f:
            content = f.read()
    except FileNotFoundError:
        return ActionResult(error=f'File {path} does not exist')
    except (OSError, UnicodeDecodeError) as e:
        msg = f'Failed to read file {path}: {str(e)}'
        logger.info(msg)
        return ActionResult(error=msg)

    msg = f'File content: {content}'
    logger.info(msg)
    return ActionResult(extracted_content=msg, include_in_memory=True)
|
|
|
|
|
|
def create_file(file_type: str = 'txt') -> str:
    """Create ``tmp.<file_type>`` in the current working directory and return its path.

    The file always contains the literal text ``test``, whatever the extension.

    Args:
        file_type: Extension (without the dot) used in the file name.

    Returns:
        The path of the created file, built from ``Path.cwd()``, as a string.
    """
    # Build the target once so the file written and the path returned cannot diverge.
    file_path = Path.cwd() / f'tmp.{file_type}'
    # Explicit encoding keeps the written bytes independent of the platform locale.
    file_path.write_text('test', encoding='utf-8')
    logger.info(f'Created file: {file_path}')
    return str(file_path)
|
|
|
|
|
|
async def main():
    """Run the file-upload demo: create sample files, run the agent, close the browser.

    Three sample files (txt, pdf, csv) are created with ``create_file`` and handed
    to the agent as its ``available_file_paths``. The browser is closed once the
    run ends, whether it succeeded or raised, and the function then waits for
    Enter on stdin before returning.
    """
    task = 'Go to https://kzmpmkh2zfk1ojnpxfn1.lite.vusercontent.net/ and - read the file content and upload them to fields'

    # All three files hold the same plain text; only the extension differs.
    available_file_paths = [create_file('txt'), create_file('pdf'), create_file('csv')]

    model = ChatOpenAI(model='gpt-4o')
    agent = Agent(
        task=task,
        llm=model,
        controller=controller,
        browser=browser,
        available_file_paths=available_file_paths,
    )

    try:
        await agent.run()
    finally:
        # Close the browser even when the run raises, so it is not left open.
        await browser.close()

    input('Press Enter to close...')
|
|
|
|
|
|
if __name__ == '__main__':
    # Script entry point: run the async demo to completion.
    asyncio.run(main())
|