Skip to content

Commit a898cc9

Browse files
committed
Additional updates from 3.5 to 4o-mini and 4 to 4o
Signed-off-by: Mark Sze <[email protected]>
1 parent f8b5e55 commit a898cc9

26 files changed: +75 and -99 lines changed

test/agentchat/contrib/agent_eval/test_agent_eval.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -38,13 +38,12 @@ def remove_ground_truth(test_case: str):
3838
filter_dict={
3939
"api_type": ["openai"],
4040
"model": [
41+
"gpt-4o-mini",
42+
"gpt-4o",
4143
"gpt-4-turbo",
4244
"gpt-4-turbo-preview",
4345
"gpt-4-0125-preview",
4446
"gpt-4-1106-preview",
45-
"gpt-3.5-turbo",
46-
"gpt-3.5-turbo-0125",
47-
"gpt-3.5-turbo-1106",
4847
],
4948
},
5049
)

test/agentchat/contrib/capabilities/chat_with_teachable_agent.py

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -17,12 +17,8 @@
1717
from test_assistant_agent import KEY_LOC, OAI_CONFIG_LIST # noqa: E402
1818

1919
# Specify the model to use. GPT-3.5 is less reliable than GPT-4 at learning from user input.
20-
filter_dict = {"model": ["gpt-4-0125-preview"]}
21-
# filter_dict = {"model": ["gpt-3.5-turbo-1106"]}
22-
# filter_dict = {"model": ["gpt-4-0613"]}
23-
# filter_dict = {"model": ["gpt-3.5-turbo"]}
24-
# filter_dict = {"model": ["gpt-4"]}
25-
# filter_dict = {"model": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}
20+
filter_dict = {"model": ["gpt-4o-mini"]}
21+
# filter_dict = {"model": ["gpt-4-0125-preview"]}
2622

2723

2824
def create_teachable_agent(reset_db=False):

test/agentchat/contrib/capabilities/test_image_generation_capability.py

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@
3232
sys.path.append(os.path.join(os.path.dirname(__file__), "../.."))
3333
from conftest import MOCK_OPEN_AI_API_KEY, skip_openai # noqa: E402
3434

35-
filter_dict = {"model": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}
35+
filter_dict = {"model": ["gpt-4o-mini"]}
3636

3737
RESOLUTIONS = ["256x256", "512x512", "1024x1024"]
3838
QUALITIES = ["standard", "hd"]
@@ -67,21 +67,21 @@ def api_key():
6767

6868
@pytest.fixture
6969
def dalle_config() -> Dict[str, Any]:
70-
config_list = openai_utils.config_list_from_models(model_list=["dall-e-2"], exclude="aoai")
70+
config_list = openai_utils.config_list_from_models(model_list=["dall-e-3"], exclude="aoai")
7171
if not config_list:
72-
config_list = [{"model": "dall-e-2", "api_key": api_key()}]
72+
config_list = [{"model": "dall-e-3", "api_key": api_key()}]
7373
return {"config_list": config_list, "timeout": 120, "cache_seed": None}
7474

7575

7676
@pytest.fixture
77-
def gpt3_config() -> Dict[str, Any]:
77+
def gpt4_config() -> Dict[str, Any]:
7878
config_list = [
7979
{
80-
"model": "gpt-35-turbo-16k",
80+
"model": "gpt-4o-mini",
8181
"api_key": api_key(),
8282
},
8383
{
84-
"model": "gpt-3.5-turbo-16k",
84+
"model": "gpt-4o",
8585
"api_key": api_key(),
8686
},
8787
]

test/agentchat/contrib/capabilities/test_teachable_agent.py

Lines changed: 1 addition & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -31,10 +31,8 @@
3131
# Specify the model to use by uncommenting one of the following lines.
3232
# filter_dict={"model": ["gpt-4-1106-preview"]}
3333
# filter_dict={"model": ["gpt-4-0613"]}
34-
# filter_dict={"model": ["gpt-3.5-turbo-1106"]}
35-
# filter_dict={"model": ["gpt-3.5-turbo-0613"]}
3634
# filter_dict={"model": ["gpt-4"]}
37-
filter_dict = {"tags": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}
35+
filter_dict = {"tags": ["gpt-4o-mini"]}
3836

3937

4038
def create_teachable_agent(reset_db=False, verbosity=0):

test/agentchat/contrib/capabilities/test_transform_messages.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -33,7 +33,7 @@ def test_transform_messages_capability():
3333
OAI_CONFIG_LIST,
3434
KEY_LOC,
3535
filter_dict={
36-
"model": "gpt-3.5-turbo",
36+
"model": "gpt-4o-mini",
3737
},
3838
)
3939

test/agentchat/contrib/test_agent_builder.py

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -51,8 +51,8 @@ def test_build():
5151
builder = AgentBuilder(
5252
config_file_or_env=OAI_CONFIG_LIST,
5353
config_file_location=KEY_LOC,
54-
builder_model_tags=["gpt-4"],
55-
agent_model_tags=["gpt-4"],
54+
builder_model_tags=["gpt-4o"],
55+
agent_model_tags=["gpt-4o"],
5656
)
5757
building_task = (
5858
"Find a paper on arxiv by programming, and analyze its application in some domain. "
@@ -83,8 +83,8 @@ def test_build_from_library():
8383
builder = AgentBuilder(
8484
config_file_or_env=OAI_CONFIG_LIST,
8585
config_file_location=KEY_LOC,
86-
builder_model_tags=["gpt-4"],
87-
agent_model_tags=["gpt-4"],
86+
builder_model_tags=["gpt-4o"],
87+
agent_model_tags=["gpt-4o"],
8888
)
8989
building_task = (
9090
"Find a paper on arxiv by programming, and analyze its application in some domain. "
@@ -136,8 +136,8 @@ def test_save():
136136
builder = AgentBuilder(
137137
config_file_or_env=OAI_CONFIG_LIST,
138138
config_file_location=KEY_LOC,
139-
builder_model_tags=["gpt-4"],
140-
agent_model_tags=["gpt-4"],
139+
builder_model_tags=["gpt-4o"],
140+
agent_model_tags=["gpt-4o"],
141141
)
142142
building_task = (
143143
"Find a paper on arxiv by programming, and analyze its application in some domain. "
@@ -175,8 +175,8 @@ def test_load():
175175
config_file_location=KEY_LOC,
176176
# builder_model=["gpt-4", "gpt-4-1106-preview"],
177177
# agent_model=["gpt-4", "gpt-4-1106-preview"],
178-
builder_model_tags=["gpt-4"],
179-
agent_model_tags=["gpt-4"],
178+
builder_model_tags=["gpt-4o"],
179+
agent_model_tags=["gpt-4o"],
180180
)
181181

182182
config_save_path = f"{here}/example_test_agent_builder_config.json"
@@ -204,8 +204,8 @@ def test_clear_agent():
204204
builder = AgentBuilder(
205205
config_file_or_env=OAI_CONFIG_LIST,
206206
config_file_location=KEY_LOC,
207-
builder_model_tags=["gpt-4"],
208-
agent_model_tags=["gpt-4"],
207+
builder_model_tags=["gpt-4o"],
208+
agent_model_tags=["gpt-4o"],
209209
)
210210

211211
config_save_path = f"{here}/example_test_agent_builder_config.json"

test/agentchat/contrib/test_gpt_assistant.py

Lines changed: 0 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -40,9 +40,6 @@
4040
"gpt-4-turbo-preview",
4141
"gpt-4-0125-preview",
4242
"gpt-4-1106-preview",
43-
"gpt-3.5-turbo",
44-
"gpt-3.5-turbo-0125",
45-
"gpt-3.5-turbo-1106",
4643
],
4744
},
4845
)

test/agentchat/contrib/test_llamaindex_conversable_agent.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ def test_group_chat_with_llama_index_conversable_agent(chat_mock: MagicMock) ->
4848
Each agent is set to describe an image in a unique style, but the chat should not exceed the specified max_rounds.
4949
"""
5050
llm = OpenAI(
51-
model="gpt-4",
51+
model="gpt-4o",
5252
temperature=0.0,
5353
api_key=openaiKey,
5454
)

test/agentchat/contrib/test_reasoning_agent.py

Lines changed: 5 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -43,7 +43,7 @@ def think_node():
4343
@pytest.fixture
4444
def reasoning_agent():
4545
"""Create a ReasoningAgent instance for testing"""
46-
config_list = [{"model": "gpt-4", "api_key": "fake_key"}]
46+
config_list = [{"model": "gpt-4o", "api_key": "fake_key"}]
4747
llm_config = {"config_list": config_list, "temperature": 0}
4848
return ReasoningAgent("reasoning_agent", llm_config=llm_config)
4949

@@ -164,7 +164,10 @@ def test_reasoning_agent_answer():
164164

165165
def helper_test_reasoning_agent_answer(max_depth, beam_size, answer_approach):
166166
"""Test that ReasoningAgent properly terminates when TERMINATE is received"""
167-
mock_config = {"config_list": [{"model": "gpt-4", "api_key": "fake", "base_url": "0.0.0.0:8000"}], "temperature": 0}
167+
mock_config = {
168+
"config_list": [{"model": "gpt-4o", "api_key": "fake", "base_url": "0.0.0.0:8000"}],
169+
"temperature": 0,
170+
}
168171
with patch("autogen.agentchat.conversable_agent.ConversableAgent.generate_oai_reply") as mock_oai_reply:
169172
agent = ReasoningAgent(
170173
"test_agent",

test/agentchat/test_agent_logging.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,7 @@
5050
config_list = autogen.config_list_from_json(
5151
OAI_CONFIG_LIST,
5252
filter_dict={
53-
"tags": ["gpt-3.5-turbo"],
53+
"tags": ["gpt-4o-mini"],
5454
},
5555
file_location=KEY_LOC,
5656
)

0 commit comments

Comments
 (0)