openai-e2e: change model

asamal4 · asamal4 · commit c2380fd9f686 · 2025-04-22T14:58:04.000+05:30
diff --git a/tests/config/operator_install/olsconfig.crd.openai_introspection.yaml b/tests/config/operator_install/olsconfig.crd.openai_introspection.yaml
@@ -15,6 +15,10 @@ spec:
           name: llmcreds
         models:
           - name: gpt-4o-mini
+          - name: gpt-4o
+          - name: gpt-4
+          - name: gpt-4-turbo
+          - name: gpt-4.1-nano
         name: openai
         type: openai
   ols:
diff --git a/tests/e2e/test_query_endpoint.py b/tests/e2e/test_query_endpoint.py
@@ -199,13 +199,117 @@ def test_too_long_question() -> None:
 @pytest.mark.introspection
 @pytest.mark.smoketest
 @pytest.mark.rag
-def test_valid_question() -> None:
+def test_valid_question_4o_mini() -> None:
     """Check the REST API /v1/query with POST HTTP method for valid question and no yaml."""
     with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
         cid = suid.get_suid()
         response = pytest.client.post(
             QUERY_ENDPOINT,
-            json={"conversation_id": cid, "query": "what is kubernetes?"},
+            json={
+                "conversation_id": cid,
+                "query": "what is kubernetes?",
+                "provider": "openai",
+                "model": "gpt-4o-mini",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+        assert "Kubernetes is" in json_response["response"]
+        assert re.search(
+            r"orchestration (tool|system|platform|engine)",
+            json_response["response"],
+            re.IGNORECASE,
+        )
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_valid_question_4o() -> None:
+    """Check the REST API /v1/query with POST HTTP method for valid question and no yaml."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "what is kubernetes?",
+                "provider": "openai",
+                "model": "gpt-4o",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+        assert "Kubernetes is" in json_response["response"]
+        assert re.search(
+            r"orchestration (tool|system|platform|engine)",
+            json_response["response"],
+            re.IGNORECASE,
+        )
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_valid_question_4() -> None:
+    """Check the REST API /v1/query with POST HTTP method for valid question and no yaml."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "what is kubernetes?",
+                "provider": "openai",
+                "model": "gpt-4",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+        assert "Kubernetes is" in json_response["response"]
+        assert re.search(
+            r"orchestration (tool|system|platform|engine)",
+            json_response["response"],
+            re.IGNORECASE,
+        )
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_valid_question_nano() -> None:
+    """Check the REST API /v1/query with POST HTTP method for valid question and no yaml."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "what is kubernetes?",
+                "provider": "openai",
+                "model": "gpt-4.1-nano",
+            },
             timeout=test_api.LLM_REST_API_TIMEOUT,
         )
         assert response.status_code == requests.codes.ok
@@ -348,7 +452,6 @@ def test_token_counters_for_query_call_with_improper_payload() -> None:
 
 @pytest.mark.introspection
 @pytest.mark.rag
-@retry(max_attempts=3, wait_between_runs=10)
 def test_rag_question() -> None:
     """Ensure responses include rag references."""
     with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
@@ -585,8 +688,94 @@ def test_query_with_unknown_model() -> None:
 
 
 @pytest.mark.introspection
-@retry(max_attempts=3, wait_between_runs=10)
-def test_tool_calling() -> None:
+def test_tool_calling_4o_mini() -> None:
+    """Check the REST API /v1/query with POST HTTP method for tool calling."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "show me pods in openshift-lightspeed namespace",
+                "provider": "openai",
+                "model": "gpt-4o-mini",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+
+        assert "lightspeed-app-server" in json_response["response"].lower()
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_tool_calling_4o() -> None:
+    """Check the REST API /v1/query with POST HTTP method for tool calling."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "show me pods in openshift-lightspeed namespace",
+                "provider": "openai",
+                "model": "gpt-4o",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+
+        assert "lightspeed-app-server" in json_response["response"].lower()
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_tool_calling_4() -> None:
+    """Check the REST API /v1/query with POST HTTP method for tool calling."""
+    with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
+        cid = suid.get_suid()
+        response = pytest.client.post(
+            QUERY_ENDPOINT,
+            json={
+                "conversation_id": cid,
+                "query": "show me pods in openshift-lightspeed namespace",
+                "provider": "openai",
+                "model": "gpt-4",
+            },
+            timeout=test_api.LLM_REST_API_TIMEOUT,
+        )
+        assert response.status_code == requests.codes.ok
+
+        response_utils.check_content_type(response, "application/json")
+        print(vars(response))
+        json_response = response.json()
+
+        # check a few key pieces of information in the response
+        assert json_response["conversation_id"] == cid
+
+        assert "lightspeed-app-server" in json_response["response"].lower()
+        assert json_response["input_tokens"] > 0
+        assert json_response["output_tokens"] > 0
+
+
+@pytest.mark.introspection
+def test_tool_calling_nano() -> None:
     """Check the REST API /v1/query with POST HTTP method for tool calling."""
     with metrics_utils.RestAPICallCounterChecker(pytest.metrics_client, QUERY_ENDPOINT):
         cid = suid.get_suid()
@@ -595,6 +784,8 @@ def test_tool_calling() -> None:
             json={
                 "conversation_id": cid,
                 "query": "show me pods in openshift-lightspeed namespace",
+                "provider": "openai",
+                "model": "gpt-4.1-nano",
             },
             timeout=test_api.LLM_REST_API_TIMEOUT,
         )
diff --git a/tests/scripts/test-e2e-cluster.sh b/tests/scripts/test-e2e-cluster.sh
@@ -37,35 +37,35 @@ function run_suites() {
   # runsuite arguments:
   # suiteid test_tags provider provider_keypath model ols_image
   # empty test_tags means run all tests
-  run_suite "azure_openai" "not certificates and not (introspection and not smoketest and not rag)" "azure_openai" "$AZUREOPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "n"
-  (( rc = rc || $? ))
-
-  # # BAM is currently not working, commenting for now
-  # run_suite "bam" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "bam" "$BAM_PROVIDER_KEY_PATH" "ibm/granite-3-8b-instruct" "$OLS_IMAGE" "n"
+  # run_suite "azure_openai" "not certificates and not (introspection and not smoketest and not rag)" "azure_openai" "$AZUREOPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "n"
   # (( rc = rc || $? ))
 
-  run_suite "openai" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "openai" "$OPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "n"
-  (( rc = rc || $? ))
+  # # # BAM is currently not working; commented out for now
+  # # run_suite "bam" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "bam" "$BAM_PROVIDER_KEY_PATH" "ibm/granite-3-8b-instruct" "$OLS_IMAGE" "n"
+  # # (( rc = rc || $? ))
 
-  run_suite "watsonx" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "watsonx" "$WATSONX_PROVIDER_KEY_PATH" "ibm/granite-3-8b-instruct" "$OLS_IMAGE" "n"
-  (( rc = rc || $? ))
+  # run_suite "openai" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "openai" "$OPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "n"
+  # (( rc = rc || $? ))
 
-  # smoke tests for RHOAI VLLM-compatible provider
-  run_suite "rhoai_vllm" "smoketest" "rhoai_vllm" "$OPENAI_PROVIDER_KEY_PATH" "gpt-3.5-turbo" "$OLS_IMAGE" "n"
-  (( rc = rc || $? ))
+  # run_suite "watsonx" "not azure_entra_id and not certificates and not (introspection and not smoketest and not rag)" "watsonx" "$WATSONX_PROVIDER_KEY_PATH" "ibm/granite-3-8b-instruct" "$OLS_IMAGE" "n"
+  # (( rc = rc || $? ))
 
-  # smoke tests for RHELAI VLLM-compatible provider
-  run_suite "rhelai_vllm" "smoketest" "rhelai_vllm" "$OPENAI_PROVIDER_KEY_PATH" "gpt-3.5-turbo" "$OLS_IMAGE" "n"
-  (( rc = rc || $? ))
+  # # smoke tests for RHOAI VLLM-compatible provider
+  # run_suite "rhoai_vllm" "smoketest" "rhoai_vllm" "$OPENAI_PROVIDER_KEY_PATH" "gpt-3.5-turbo" "$OLS_IMAGE" "n"
+  # (( rc = rc || $? ))
+
+  # # smoke tests for RHELAI VLLM-compatible provider
+  # run_suite "rhelai_vllm" "smoketest" "rhelai_vllm" "$OPENAI_PROVIDER_KEY_PATH" "gpt-3.5-turbo" "$OLS_IMAGE" "n"
+  # (( rc = rc || $? ))
 
   # TODO: Reduce execution time. Sequential execution will take more time. Parallel execution will have cluster claim issue.
   # Run tool calling - Enable introspection
-  run_suite "azure_openai_introspection" "introspection" "azure_openai" "$AZUREOPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "y"
-  (( rc = rc || $? ))
+  # run_suite "azure_openai_introspection" "introspection" "azure_openai" "$AZUREOPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "y"
+  # (( rc = rc || $? ))
   run_suite "openai_introspection" "introspection" "openai" "$OPENAI_PROVIDER_KEY_PATH" "gpt-4o-mini" "$OLS_IMAGE" "y"
   (( rc = rc || $? ))
-  run_suite "watsonx_introspection" "introspection" "watsonx" "$WATSONX_PROVIDER_KEY_PATH" "ibm/granite-3-2-8b-instruct" "$OLS_IMAGE" "y"
-  (( rc = rc || $? ))
+  # run_suite "watsonx_introspection" "introspection" "watsonx" "$WATSONX_PROVIDER_KEY_PATH" "ibm/granite-3-2-8b-instruct" "$OLS_IMAGE" "y"
+  # (( rc = rc || $? ))
 
   set -e