From c6aee7e67139d6ad04ff164f286335377dd9fbdc Mon Sep 17 00:00:00 2001 From: Saifeddine ALOUI Date: Sun, 11 Feb 2024 15:56:20 +0100 Subject: [PATCH] Added /chat endpoint to the queued services --- ollama_proxy_server/main.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ollama_proxy_server/main.py b/ollama_proxy_server/main.py index 76f638b..894e729 100644 --- a/ollama_proxy_server/main.py +++ b/ollama_proxy_server/main.py @@ -139,7 +139,7 @@ def main(): min_queued_server = server # Apply the queuing mechanism only for a specific endpoint. - if path == '/api/generate': + if path == '/api/generate' or path == '/api/chat': que = min_queued_server[1]['queue'] client_ip, client_port = self.client_address self.add_access_log_entry(event="gen_request", user=self.user, ip_address=client_ip, access="Authorized", server=min_queued_server[0], nb_queued_requests_on_server=que.qsize())