Skip to content

Commit f2f8cf8

Browse files
committed
Eval models
1 parent 88f018a commit f2f8cf8

File tree

4 files changed

+88
-0
lines changed

4 files changed

+88
-0
lines changed

eval/deepseek-r1.py

+24
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
import os
2+
3+
from dotenv import load_dotenv
4+
from langchain_openai import ChatOpenAI
5+
from pydantic import SecretStr
6+
7+
from browser_use import Agent
8+
9+
# Run python-dotenv's loader first so the lookup below sees anything it provides.
load_dotenv()

# Refuse to import without a usable key: an unset or empty variable is an error.
api_key_deepseek = os.environ.get('DEEPSEEK_API_KEY', '')
if not api_key_deepseek:
    raise ValueError('DEEPSEEK_API_KEY is not set')
14+
15+
16+
async def run_agent(task: str, max_steps: int = 38):
    """Run a browser_use ``Agent`` on ``task`` with the ``deepseek-reasoner`` model.

    The model is reached through ``ChatOpenAI`` pointed at the DeepSeek
    endpoint, and the agent is created with ``use_vision=False``.

    Args:
        task: Task description handed to the agent.
        max_steps: Forwarded unchanged as ``Agent.run(max_steps=...)``.

    Returns:
        Whatever ``Agent.run`` returns once awaited.
    """
    deepseek_model = ChatOpenAI(
        model='deepseek-reasoner',
        base_url='https://api.deepseek.com/v1',
        api_key=SecretStr(api_key_deepseek),
    )
    browser_agent = Agent(task=task, llm=deepseek_model, use_vision=False)
    return await browser_agent.run(max_steps=max_steps)

eval/deepseek.py

+24
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,24 @@
1+
import os
2+
3+
from dotenv import load_dotenv
4+
from langchain_openai import ChatOpenAI
5+
from pydantic import SecretStr
6+
7+
from browser_use import Agent
8+
9+
# Run python-dotenv's loader first so the lookup below sees anything it provides.
load_dotenv()

# Refuse to import without a usable key: an unset or empty variable is an error.
api_key_deepseek = os.environ.get('DEEPSEEK_API_KEY', '')
if not api_key_deepseek:
    raise ValueError('DEEPSEEK_API_KEY is not set')
14+
15+
16+
async def run_agent(task: str, max_steps: int = 38):
    """Run a browser_use ``Agent`` on ``task`` with the ``deepseek-chat`` model.

    The model is reached through ``ChatOpenAI`` pointed at the DeepSeek
    endpoint, and the agent is created with ``use_vision=False``.

    Args:
        task: Task description handed to the agent.
        max_steps: Forwarded unchanged as ``Agent.run(max_steps=...)``.

    Returns:
        Whatever ``Agent.run`` returns once awaited.
    """
    deepseek_model = ChatOpenAI(
        model='deepseek-chat',
        base_url='https://api.deepseek.com/v1',
        api_key=SecretStr(api_key_deepseek),
    )
    browser_agent = Agent(task=task, llm=deepseek_model, use_vision=False)
    return await browser_agent.run(max_steps=max_steps)

eval/gemini-1.5-flash.py

+20
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
import os
2+
3+
from dotenv import load_dotenv
4+
from langchain_google_genai import ChatGoogleGenerativeAI
5+
from pydantic import SecretStr
6+
7+
from browser_use import Agent
8+
9+
# Run python-dotenv's loader first so the lookup below sees anything it provides.
load_dotenv()

# Refuse to import without a usable key: an unset or empty variable is an error.
api_key = os.environ.get('GEMINI_API_KEY', '')
if not api_key:
    raise ValueError('GEMINI_API_KEY is not set')
14+
15+
16+
async def run_agent(task: str, max_steps: int = 38):
    """Run a browser_use ``Agent`` on ``task`` with ``gemini-1.5-flash-latest``.

    Args:
        task: Task description handed to the agent.
        max_steps: Forwarded unchanged as ``Agent.run(max_steps=...)``.

    Returns:
        Whatever ``Agent.run`` returns once awaited.
    """
    gemini_model = ChatGoogleGenerativeAI(
        model='gemini-1.5-flash-latest',
        api_key=SecretStr(api_key),
    )
    browser_agent = Agent(task=task, llm=gemini_model)
    return await browser_agent.run(max_steps=max_steps)

eval/gemini-2.0-flash.py

+20
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,20 @@
1+
import os
2+
3+
from dotenv import load_dotenv
4+
from langchain_google_genai import ChatGoogleGenerativeAI
5+
from pydantic import SecretStr
6+
7+
from browser_use import Agent
8+
9+
# Run python-dotenv's loader first so the lookup below sees anything it provides.
load_dotenv()

# Refuse to import without a usable key: an unset or empty variable is an error.
api_key = os.environ.get('GEMINI_API_KEY', '')
if not api_key:
    raise ValueError('GEMINI_API_KEY is not set')
14+
15+
16+
async def run_agent(task: str, max_steps: int = 38):
    """Run a browser_use ``Agent`` on ``task`` with ``gemini-2.0-flash-exp``.

    Args:
        task: Task description handed to the agent.
        max_steps: Forwarded unchanged as ``Agent.run(max_steps=...)``.

    Returns:
        Whatever ``Agent.run`` returns once awaited.
    """
    gemini_model = ChatGoogleGenerativeAI(
        model='gemini-2.0-flash-exp',
        api_key=SecretStr(api_key),
    )
    browser_agent = Agent(task=task, llm=gemini_model)
    return await browser_agent.run(max_steps=max_steps)

0 commit comments

Comments
 (0)