[misc] fix accelerator (#9661)

Co-authored-by: gemini-code-assist[bot] <176961590+gemini-code-assist[bot]@users.noreply.github.com>
2026-02-26 15:56:00 +08:00 · 2025-12-25 02:11:04 +08:00
parent 6a2eafbae3
commit a754604c11
44 changed files with 396 additions and 448 deletions
--- a/tests/e2e/test_chat.py
+++ b/tests/e2e/test_chat.py
@@ -37,13 +37,13 @@ MESSAGES = [
 EXPECTED_RESPONSE = "_rho"


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cpu", "mps"])
 def test_chat():
    chat_model = ChatModel(INFER_ARGS)
    assert chat_model.chat(MESSAGES)[0].response_text == EXPECTED_RESPONSE


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cpu", "mps"])
 def test_stream_chat():
    chat_model = ChatModel(INFER_ARGS)
    response = ""
--- a/tests/e2e/test_sglang.py
+++ b/tests/e2e/test_sglang.py
@@ -39,7 +39,7 @@ MESSAGES = [
 ]


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cuda"])
@pytest.mark.skipif(not is_sglang_available(), reason="SGLang is not installed")
 def test_chat():
    r"""Test the SGLang engine's basic chat functionality."""
@@ -49,7 +49,7 @@ def test_chat():
    print(response.response_text)


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cuda"])
@pytest.mark.skipif(not is_sglang_available(), reason="SGLang is not installed")
 def test_stream_chat():
    r"""Test the SGLang engine's streaming chat functionality."""
--- a/tests/e2e/test_train.py
+++ b/tests/e2e/test_train.py
@@ -49,7 +49,7 @@ INFER_ARGS = {
 OS_NAME = os.getenv("OS_NAME", "")


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cpu", "mps"])
@pytest.mark.parametrize(
    "stage,dataset",
    [
@@ -66,7 +66,7 @@ def test_run_exp(stage: str, dataset: str):
    assert os.path.exists(output_dir)


-@pytest.mark.runs_on(["cpu"])
+@pytest.mark.runs_on(["cpu", "mps"])
 def test_export():
    export_dir = os.path.join("output", "llama3_export")
    export_model({"export_dir": export_dir, **INFER_ARGS})