Skip to content

Commit

Permalink
use gpt-4o-mini for tests
Browse files: browse the repository at this point in the history
  • Loading branch information
ekzhu committed Oct 1, 2024
1 parent 00941b0 commit 0448fe6
Show file tree
Hide file tree
Showing 10 changed files with 12 additions and 33 deletions.
2 changes: 1 addition & 1 deletion notebook/agentchat_function_call_currency_calculator.ipynb
Original file line number Diff line number Diff line change
Expand Up @@ -65,7 +65,7 @@
"\n",
"config_list = autogen.config_list_from_json(\n",
" \"OAI_CONFIG_LIST\",\n",
" filter_dict={\"tags\": [\"tools\"]}, # comment out to get all\n",
" filter_dict={\"tags\": [\"tool\"]}, # comment out to get all\n",
")"
]
},
Expand Down
7 changes: 1 addition & 6 deletions test/agentchat/contrib/agent_eval/test_agent_eval.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,13 +32,8 @@ def remove_ground_truth(test_case: str):
filter_dict={
"api_type": ["openai"],
"model": [
"gpt-4-turbo",
"gpt-4-turbo-preview",
"gpt-4-0125-preview",
"gpt-4-1106-preview",
"gpt-4o-mini",
"gpt-3.5-turbo",
"gpt-3.5-turbo-0125",
"gpt-3.5-turbo-1106",
],
},
)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,8 @@
from test_assistant_agent import KEY_LOC, OAI_CONFIG_LIST # noqa: E402

# Specify the model to use. GPT-3.5 is less reliable than GPT-4 at learning from user input.
filter_dict = {"model": ["gpt-4-0125-preview"]}
filter_dict = {"model": ["gpt-4o-mini"]}
# filter_dict = {"model": ["gpt-4-0125-preview"]}
# filter_dict = {"model": ["gpt-3.5-turbo-1106"]}
# filter_dict = {"model": ["gpt-4-0613"]}
# filter_dict = {"model": ["gpt-3.5-turbo"]}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -26,8 +26,6 @@
sys.path.append(os.path.join(os.path.dirname(__file__), "../.."))
from conftest import MOCK_OPEN_AI_API_KEY, skip_openai # noqa: E402

filter_dict = {"model": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}

RESOLUTIONS = ["256x256", "512x512", "1024x1024"]
QUALITIES = ["standard", "hd"]
PROMPTS = [
Expand Down
3 changes: 2 additions & 1 deletion test/agentchat/contrib/capabilities/test_teachable_agent.py
Original file line number Diff line number Diff line change
Expand Up @@ -28,7 +28,8 @@
# filter_dict={"model": ["gpt-3.5-turbo-1106"]}
# filter_dict={"model": ["gpt-3.5-turbo-0613"]}
# filter_dict={"model": ["gpt-4"]}
filter_dict = {"tags": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}
# filter_dict = {"tags": ["gpt-35-turbo-16k", "gpt-3.5-turbo-16k"]}
filter_dict={"model": ["gpt-4o-mini"]}


def create_teachable_agent(reset_db=False, verbosity=0):
Expand Down
2 changes: 1 addition & 1 deletion test/agentchat/test_tool_calls.py
Original file line number Diff line number Diff line change
Expand Up @@ -144,7 +144,7 @@ def test_update_tool():
config_list_gpt4 = autogen.config_list_from_json(
OAI_CONFIG_LIST,
filter_dict={
"tags": ["gpt-4"],
"tags": ["gpt-4o-mini"],
},
file_location=KEY_LOC,
)
Expand Down
8 changes: 1 addition & 7 deletions test/io/test_websockets.py
Original file line number Diff line number Diff line change
Expand Up @@ -97,14 +97,8 @@ def on_connect(iostream: IOWebsockets, success_dict: Dict[str, bool] = success_d
OAI_CONFIG_LIST,
filter_dict={
"model": [
"gpt-4o-mini",
"gpt-3.5-turbo",
"gpt-3.5-turbo-16k",
"gpt-4",
"gpt-4-0314",
"gpt4",
"gpt-4-32k",
"gpt-4-32k-0314",
"gpt-4-32k-v0314",
],
},
file_location=KEY_LOC,
Expand Down
14 changes: 2 additions & 12 deletions test/oai/_test_completion.py
Original file line number Diff line number Diff line change
Expand Up @@ -143,13 +143,8 @@ def test_nocontext():
file_location=KEY_LOC,
filter_dict={
"model": {
"gpt-4o-mini",
"gpt-3.5-turbo",
"gpt-3.5-turbo-16k",
"gpt-3.5-turbo-16k-0613",
"gpt-3.5-turbo-0301",
"chatgpt-35-turbo-0301",
"gpt-35-turbo-v0301",
"gpt",
},
},
),
Expand Down Expand Up @@ -179,13 +174,8 @@ def test_humaneval(num_samples=1):
env_or_file=OAI_CONFIG_LIST,
filter_dict={
"model": {
"gpt-4o-mini",
"gpt-3.5-turbo",
"gpt-3.5-turbo-16k",
"gpt-3.5-turbo-16k-0613",
"gpt-3.5-turbo-0301",
"chatgpt-35-turbo-0301",
"gpt-35-turbo-v0301",
"gpt",
},
},
file_location=KEY_LOC,
Expand Down
2 changes: 1 addition & 1 deletion test/oai/test_client.py
Original file line number Diff line number Diff line change
Expand Up @@ -89,7 +89,7 @@ def test_aoai_chat_completion():
print(client.extract_text_or_completion_object(response))


# @pytest.mark.skipif(skip or not TOOL_ENABLED, reason="openai>=1.1.0 not installed")
@pytest.mark.skipif(skip or not TOOL_ENABLED, reason="openai>=1.1.0 not installed")
@pytest.mark.skip(reason="This test is not working until Azure settings are updated")
def test_oai_tool_calling_extraction():
config_list = config_list_from_json(
Expand Down
2 changes: 1 addition & 1 deletion test/oai/test_client_stream.py
Original file line number Diff line number Diff line change
Expand Up @@ -237,7 +237,7 @@ def test_chat_tools_stream() -> None:
config_list = config_list_from_json(
env_or_file=OAI_CONFIG_LIST,
file_location=KEY_LOC,
filter_dict={"tags": ["multitool"]},
filter_dict={"tags": ["tool"]},
)
tools = [
{
Expand Down

0 comments on commit 0448fe6

Please sign in to comment.