openvinotoolkit · michalkulakowski · May 19, 2026 · Apr 30, 2026 · May 13, 2026 · May 13, 2026
diff --git a/demos/continuous_batching/README.md b/demos/continuous_batching/README.md
@@ -156,7 +156,7 @@ curl -s http://localhost:8000/v3/chat/completions -H "Content-Type: application/
 curl http://localhost:8000/v3/responses \
   -H "Content-Type: application/json" \
   -d '{
-    "model": "meta-llama/Meta-Llama-3-8B-Instruct",
+    "model": "Qwen3-30B-A3B-Instruct-2507-int4-ov",
     "max_output_tokens":30,
     "input": "What is OpenVINO?"
   }'| jq .
@@ -169,12 +169,12 @@ Windows Powershell
 (Invoke-WebRequest -Uri "http://localhost:8000/v3/responses" `
  -Method POST `
  -Headers @{ "Content-Type" = "application/json" } `
- -Body '{"model": "meta-llama/Meta-Llama-3-8B-Instruct", "max_output_tokens": 30, "input": "What is OpenVINO?"}').Content
+ -Body '{"model": "Qwen3-30B-A3B-Instruct-2507-int4-ov", "max_output_tokens": 30, "input": "What is OpenVINO?"}').Content
 ```
 
 Windows Command Prompt
 ```bat
-curl -s http://localhost:8000/v3/responses -H "Content-Type: application/json" -d "{\"model\": \"meta-llama/Meta-Llama-3-8B-Instruct\", \"max_output_tokens\": 30, \"input\": \"What is OpenVINO?\"}"
+curl -s http://localhost:8000/v3/responses -H "Content-Type: application/json" -d "{\"model\": \"Qwen3-30B-A3B-Instruct-2507-int4-ov\", \"max_output_tokens\": 30, \"input\": \"What is OpenVINO?\"}"
 ```
 :::
 
@@ -186,7 +186,7 @@ curl -s http://localhost:8000/v3/responses -H "Content-Type: application/json" -
   "id": "resp-1724405400",
   "object": "response",
   "created_at": 1724405400,
-  "model": "meta-llama/Meta-Llama-3-8B-Instruct",
+  "model": "Qwen3-30B-A3B-Instruct-2507-int4-ov",
   "status": "completed",
   "output": [
     {
@@ -337,7 +337,7 @@ client = OpenAI(
 )
 
 stream = client.responses.create(
-    model="meta-llama/Meta-Llama-3-8B-Instruct",
+    model="Qwen3-30B-A3B-Instruct-2507-int4-ov",
     input="Say this is a test",
     stream=True,
 )

diff --git a/src/llm/apis/openai_api_handler.cpp b/src/llm/apis/openai_api_handler.cpp
@@ -213,10 +213,8 @@ absl::StatusOr<ov::Tensor> loadImage(const std::string& imageSource,
         try {
             tensor = loadImageStbiFromMemory(decoded);
         } catch (std::runtime_error& e) {
-            std::stringstream ss;
-            ss << "Image parsing failed: " << e.what();
-            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, ss.str());
-            return absl::InvalidArgumentError(ss.str());
+            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, "Image parsing failed: {}", e.what());
+            return absl::InvalidArgumentError("Image parsing failed");
         }
     } else if (std::regex_match(imageSource.c_str(), std::regex("^(http|https|ftp|sftp|)://(.*)"))) {
         SPDLOG_LOGGER_TRACE(llm_calculator_logger, "Loading image using curl");
@@ -230,9 +228,7 @@ absl::StatusOr<ov::Tensor> loadImage(const std::string& imageSource,
         try {
             tensor = loadImageStbiFromMemory(decoded);
         } catch (std::runtime_error& e) {
-            std::stringstream ss;
-            ss << "Image parsing failed: " << e.what();
-            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, ss.str());
+            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, "Image parsing failed: {}", e.what());
             return absl::InvalidArgumentError("Image parsing failed");
         }
     } else {
@@ -255,10 +251,8 @@ absl::StatusOr<ov::Tensor> loadImage(const std::string& imageSource,
         try {
             tensor = loadImageStbiFromFile(resolvedImagePathStr.c_str());
         } catch (std::runtime_error& e) {
-            std::stringstream ss;
-            ss << "Image file " << resolvedImagePathStr << " parsing failed: " << e.what();
-            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, ss.str());
-            return absl::InvalidArgumentError(ss.str());
+            SPDLOG_LOGGER_DEBUG(llm_calculator_logger, "Image file {} parsing failed: {}", resolvedImagePathStr, e.what());
+            return absl::InvalidArgumentError("Image file parsing failed");
         }
     }
     return tensor;