diff --git a/pkg/server/handlers_backends.go b/pkg/server/handlers_backends.go index 9ff20b5..d3132af 100644 --- a/pkg/server/handlers_backends.go +++ b/pkg/server/handlers_backends.go @@ -94,9 +94,6 @@ func (h *Handler) LlamaCppProxy(onDemandStart bool) http.HandlerFunc { r.URL.Path = strings.TrimPrefix(r.URL.Path, prefix) } - // Update the last request time for the instance - inst.UpdateLastRequestTime() - proxy.ServeHTTP(w, r) } } diff --git a/pkg/server/handlers_instances.go b/pkg/server/handlers_instances.go index 10b88d7..7a444d0 100644 --- a/pkg/server/handlers_instances.go +++ b/pkg/server/handlers_instances.go @@ -392,9 +392,6 @@ func (h *Handler) ProxyToInstance() http.HandlerFunc { r.URL.Path = strings.TrimPrefix(r.URL.Path, prefix) } - // Update the last request time for the instance - inst.UpdateLastRequestTime() - // Set forwarded headers r.Header.Set("X-Forwarded-Host", r.Header.Get("Host")) r.Header.Set("X-Forwarded-Proto", "http") diff --git a/pkg/server/handlers_openai.go b/pkg/server/handlers_openai.go index fd9b818..9ad3207 100644 --- a/pkg/server/handlers_openai.go +++ b/pkg/server/handlers_openai.go @@ -136,9 +136,6 @@ func (h *Handler) OpenAIProxy() http.HandlerFunc { return } - // Update last request time for the instance - inst.UpdateLastRequestTime() - // Recreate the request body from the bytes we read r.Body = io.NopCloser(bytes.NewReader(bodyBytes)) r.ContentLength = int64(len(bodyBytes))