[Add] browser-use and main.py

This commit is contained in:
tv0924@icloud.com 2025-05-18 21:57:54 +09:00
commit 96914d44ac
221 changed files with 30952 additions and 1 deletions

View file

@ -0,0 +1,19 @@
from dotenv import load_dotenv
from langchain_anthropic import ChatAnthropic
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``claude-3-5-sonnet-20240620``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatAnthropic(
        model_name='claude-3-5-sonnet-20240620',
        temperature=0.0,
        timeout=100,
        stop=None,
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,19 @@
from dotenv import load_dotenv
from langchain_anthropic import ChatAnthropic
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``claude-3-5-sonnet-20241022``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatAnthropic(
        model_name='claude-3-5-sonnet-20241022',
        temperature=0.0,
        timeout=100,
        stop=None,
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,19 @@
from dotenv import load_dotenv
from langchain_anthropic import ChatAnthropic
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``claude-3-7-sonnet-20250219``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatAnthropic(
        model_name='claude-3-7-sonnet-20250219',
        temperature=0.0,
        timeout=100,
        stop=None,
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,25 @@
import os
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the DeepSeek credential once at import time; importing this module
# without it raises immediately.
api_key_deepseek = os.environ.get('DEEPSEEK_API_KEY', '')
if api_key_deepseek == '':
    raise ValueError('DEEPSEEK_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with the ``deepseek-reasoner`` model.

    The model is reached through ``ChatOpenAI`` pointed at
    ``https://api.deepseek.com/v1`` and authenticated with the module-level
    ``api_key_deepseek``. The agent is created with ``use_vision=False``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(
        base_url='https://api.deepseek.com/v1',
        model='deepseek-reasoner',
        api_key=SecretStr(api_key_deepseek),
    )
    runner = Agent(task=task, llm=chat_model, use_vision=False, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,25 @@
import os
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the DeepSeek credential once at import time; importing this module
# without it raises immediately.
api_key_deepseek = os.environ.get('DEEPSEEK_API_KEY', '')
if api_key_deepseek == '':
    raise ValueError('DEEPSEEK_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with the ``deepseek-chat`` model.

    The model is reached through ``ChatOpenAI`` pointed at
    ``https://api.deepseek.com/v1`` and authenticated with the module-level
    ``api_key_deepseek``. The agent is created with ``use_vision=False``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(
        base_url='https://api.deepseek.com/v1',
        model='deepseek-chat',
        api_key=SecretStr(api_key_deepseek),
    )
    runner = Agent(task=task, llm=chat_model, use_vision=False, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,21 @@
import os
from dotenv import load_dotenv
from langchain_google_genai import ChatGoogleGenerativeAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the Google credential once at import time; importing this module
# without it raises immediately.
api_key = os.environ.get('GOOGLE_API_KEY', '')
if api_key == '':
    raise ValueError('GOOGLE_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gemini-1.5-flash-latest``.

    The chat model is authenticated with the module-level ``api_key``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatGoogleGenerativeAI(
        model='gemini-1.5-flash-latest',
        api_key=SecretStr(api_key),
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,21 @@
import os
from dotenv import load_dotenv
from langchain_google_genai import ChatGoogleGenerativeAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the Google credential once at import time; importing this module
# without it raises immediately.
api_key = os.environ.get('GOOGLE_API_KEY', '')
if api_key == '':
    raise ValueError('GOOGLE_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gemini-2.0-flash-exp``.

    The chat model is authenticated with the module-level ``api_key``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatGoogleGenerativeAI(
        model='gemini-2.0-flash-exp',
        api_key=SecretStr(api_key),
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,21 @@
import os
from dotenv import load_dotenv
from langchain_google_genai import ChatGoogleGenerativeAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the Google credential once at import time; importing this module
# without it raises immediately.
api_key = os.environ.get('GOOGLE_API_KEY', '')
if api_key == '':
    raise ValueError('GOOGLE_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gemini-2.5-pro-preview-03-25``.

    The chat model is authenticated with the module-level ``api_key``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatGoogleGenerativeAI(
        model='gemini-2.5-pro-preview-03-25',
        api_key=SecretStr(api_key),
    )
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,17 @@
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gpt-4.1-2025-04-14``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(model='gpt-4.1-2025-04-14', temperature=0.0)
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,25 @@
import asyncio
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gpt-4o`` and highlighting off.

    Before the agent is built, ``highlight_elements`` is set to ``False`` on
    the browser's ``new_context_config``. This also modifies a browser
    passed in by the caller.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()
    context_settings = browser.config.new_context_config
    context_settings.highlight_elements = False

    chat_model = ChatOpenAI(model='gpt-4o', temperature=0.0)
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)
if __name__ == '__main__':
    # Manual entry point: drive one sample task to completion on a fresh
    # event loop when this file is executed as a script.
    task = 'Open 1 random Wikipedia pages in new tab'
    result = asyncio.run(
        run_agent(task),
    )

View file

@ -0,0 +1,17 @@
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gpt-4o`` and ``use_vision=False``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(model='gpt-4o', temperature=0.0)
    runner = Agent(task=task, llm=chat_model, use_vision=False, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,26 @@
import asyncio
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gpt-4o`` and zero viewport expansion.

    Before the agent is built, ``viewport_expansion`` is set to ``0`` on the
    browser's ``new_context_config``. This also modifies a browser passed in
    by the caller.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(model='gpt-4o', temperature=0.0)

    context_settings = browser.config.new_context_config
    context_settings.viewport_expansion = 0

    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)
if __name__ == '__main__':
    # Manual entry point: drive one sample task to completion on a fresh
    # event loop and print whatever the run returned.
    task = 'Go to https://www.google.com and search for "python" and click on the first result'
    result = asyncio.run(
        run_agent(task),
    )
    print(result)

View file

@ -0,0 +1,17 @@
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``gpt-4o``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(model='gpt-4o', temperature=0.0)
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

View file

@ -0,0 +1,16 @@
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from browser_use import Agent, Browser
load_dotenv()
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with ``o4-mini-2025-04-16``.

    No ``temperature`` is passed to ``ChatOpenAI`` here; only the model name
    is set.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    if not browser:
        browser = Browser()

    chat_model = ChatOpenAI(model='o4-mini-2025-04-16')
    runner = Agent(task=task, llm=chat_model, browser=browser)
    return await runner.run(max_steps=max_steps)

25
browser-use/eval/grok.py Normal file
View file

@ -0,0 +1,25 @@
import os
from dotenv import load_dotenv
from langchain_openai import ChatOpenAI
from pydantic import SecretStr
from browser_use import Agent, Browser
load_dotenv()
# Read the Grok credential once at import time; importing this module
# without it raises immediately.
api_key = os.environ.get('GROK_API_KEY', '')
if api_key == '':
    raise ValueError('GROK_API_KEY is not set')
async def run_agent(task: str, browser: Browser | None = None, max_steps: int = 38):
    """Run a browser-use ``Agent`` on ``task`` with the ``grok-3-beta`` model.

    The model is reached through ``ChatOpenAI`` pointed at
    ``https://api.x.ai/v1`` and authenticated with the module-level
    ``api_key``. The agent is created with ``use_vision=False``.

    Args:
        task: Task description passed to the ``Agent``.
        browser: Browser the agent should use. When falsy (the default
            ``None``), a new ``Browser()`` is created.
        max_steps: Forwarded to ``Agent.run`` as ``max_steps``.

    Returns:
        The value produced by awaiting ``Agent.run``.
    """
    browser = browser or Browser()
    llm = ChatOpenAI(
        model='grok-3-beta',
        base_url='https://api.x.ai/v1',
        api_key=SecretStr(api_key),
    )
    agent = Agent(
        task=task,
        use_vision=False,
        llm=llm,
        browser=browser,
    )
    # Previously the run was awaited without ``max_steps`` and its result was
    # dropped, so the caller's step budget was ignored and callers always got
    # None. Forward the budget and return the outcome.
    result = await agent.run(max_steps=max_steps)
    return result

1343
browser-use/eval/service.py Normal file

File diff suppressed because it is too large Load diff