From 4413881b2d593a406021616953e46ce7b6153c9d Mon Sep 17 00:00:00 2001 From: Benson Wong Date: Thu, 1 Jan 2026 13:35:45 -0800 Subject: [PATCH] proxy: actually add /v1/responses endpoint (#449) ref: #448 --- proxy/proxymanager.go | 1 + 1 file changed, 1 insertion(+) diff --git a/proxy/proxymanager.go b/proxy/proxymanager.go index f94ba408..687e83c5 100644 --- a/proxy/proxymanager.go +++ b/proxy/proxymanager.go @@ -277,6 +277,7 @@ func (pm *ProxyManager) setupGinEngine() { // Set up routes using the Gin engine // Protected routes use pm.apiKeyAuth() middleware pm.ginEngine.POST("/v1/chat/completions", pm.apiKeyAuth(), pm.proxyInferenceHandler) + pm.ginEngine.POST("/v1/responses", pm.apiKeyAuth(), pm.proxyInferenceHandler) // Support legacy /v1/completions api, see issue #12 pm.ginEngine.POST("/v1/completions", pm.apiKeyAuth(), pm.proxyInferenceHandler) // Support anthropic /v1/messages (added https://github.com/ggml-org/llama.cpp/pull/17570)