IBM vLLM 배포형 채팅 요청 스키마 분기와 문서 반영

IBM/CP4D 인증을 사용하는 vLLM 등록 모델에서 배포형 /ml/v1/deployments/.../text/chat 계열 엔드포인트를 감지하도록 정리했다. 일반 OpenAI 호환 body 대신 messages+parameters 형태의 IBM deployment chat body를 사용하고 /v1/chat/completions를 강제로 붙이지 않도록 수정했다. IBM 배포형 응답은 results.generated_text, output_text, choices.message.content를 함께 파싱하도록 보강했고 도구 호출 경로는 안전하게 일반 응답 폴백을 유도하도록 정리했다. README와 DEVELOPMENT 문서를 2026-04-06 18:02 (KST) 기준으로 갱신했고 dotnet build 검증에서 경고 0 / 오류 0을 확인했다.
2026-04-06 17:49:48 +09:00
parent e439fd144e
commit 606ecbe6cd
4 changed files with 170 additions and 10 deletions
--- a/src/AxCopilot/Services/LlmService.ToolUse.cs
+++ b/src/AxCopilot/Services/LlmService.ToolUse.cs
@@ -431,13 +431,20 @@ public partial class LlmService
        List<ChatMessage> messages, IReadOnlyCollection<IAgentTool> tools, CancellationToken ct)
    {
        var activeService = ResolveService();
-        var body = BuildOpenAiToolBody(messages, tools);

        // 등록 모델의 커스텀 엔드포인트 우선 사용 (ResolveServerInfo)
        var (resolvedEp, _, allowInsecureTls) = ResolveServerInfo();
        var endpoint = string.IsNullOrEmpty(resolvedEp)
            ? ResolveEndpointForService(activeService)
            : resolvedEp;
+        var registered = GetActiveRegisteredModel();
+        if (UsesIbmDeploymentChatApi(activeService, registered, endpoint))
+        {
+            throw new ToolCallNotSupportedException(
+                "IBM 배포형 vLLM 연결은 OpenAI 도구 호출 형식과 다를 수 있어 일반 대화 경로로 폴백합니다.");
+        }
+
+        var body = BuildOpenAiToolBody(messages, tools);

        var url = activeService.ToLowerInvariant() == "ollama"
            ? endpoint.TrimEnd('/') + "/api/chat"