Only tool-relevant tests

2024-09-30 22:24:20 +02:00
parent 8082b3651a
commit b430d318bb
1 changed file with 17 additions and 17 deletions
--- a/suite_settings/tests.py
+++ b/suite_settings/tests.py
@@ -6,24 +6,24 @@ from textwrap import dedent
 from langchain_core.messages import HumanMessage, SystemMessage, ToolMessage, AIMessage

 tests = {
-    607: Test(
-        name="Healthy Vegetables in Chinese",
-        runnable=basic_prompt,
-        runnable_input={
-            "system_msg": "You are a helpful assistant. You serve people across the globe.",
-            "human_msg": "什么蔬菜最健康？",
-        },
-        validator=system_human_answer_match,
-        validation_input={
-            "criteria": dedent("""- in Mandarin Chinese from front to finnish
-            - factually correct
-            - about healthy vegetables
-            - just one single conversational answer, without any AI fragments (A/B versions, "end of message" parts, unfitting discalimers or notes)
+    # 607: Test(
+    #     name="Healthy Vegetables in Chinese",
+    #     runnable=basic_prompt,
+    #     runnable_input={
+    #         "system_msg": "You are a helpful assistant. You serve people across the globe.",
+    #         "human_msg": "什么蔬菜最健康？",
+    #     },
+    #     validator=system_human_answer_match,
+    #     validation_input={
+    #         "criteria": dedent("""- in Mandarin Chinese from front to finnish
+    #         - factually correct
+    #         - about healthy vegetables
+    #         - just one single conversational answer, without any AI fragments (A/B versions, "end of message" parts, unfitting discalimers or notes)

-            Again, the message has to be entirely in Manadarin Chineese.
-            That means If the answer is not in Chinese the answer is NOT correct! Only if the message in in Chinese rate as correct"""),
-        },
-    ),
+    #         Again, the message has to be entirely in Manadarin Chineese.
+    #         That means If the answer is not in Chinese the answer is NOT correct! Only if the message in in Chinese rate as correct"""),
+    #     },
+    # ),
    693: Test(
        name="Simple Multiplication",
        runnable=one_tool_call_answer,