ollama Interface: comparison OllamaInterface/OllamaClient.py

-:7dd1b9cd3150
+:6e8af43d537d
 class OllamaClient(QObject):
 """
 Class implementing the 'ollama' client.
-@signal replyReceived(content:str, role:str) emitted after a response from the
+@signal replyReceived(content:str, role:str, done:bool) emitted after a response
-'ollama' server was received
+from the 'ollama' server was received
 @signal modelsList(modelNames:list[str]) emitted after the list of model
 names was obtained from the 'ollama' server
 @signal detailedModelsList(models:list[dict]) emitted after the list of
 models was obtained from the 'ollama' server giving some model details
 @signal runningModelsList(models:list[dict]) emitted after the list of
 while processing the request
 @signal serverStateChanged(ok:bool) emitted to indicate a change of the server
 responsiveness
 """
-replyReceived = pyqtSignal(str, str)
+replyReceived = pyqtSignal(str, str, bool)
 modelsList = pyqtSignal(list)
 detailedModelsList = pyqtSignal(list)
 runningModelsList = pyqtSignal(list)
 pullStatus = pyqtSignal(str, str, int, int)
 serverVersion = pyqtSignal(str)
 self.__serverResponding = False  # start with a faulty state
 self.__plugin.preferencesChanged.connect(self.__setHeartbeatTimer)
 self.__setHeartbeatTimer()
-def chat(self, model, messages):
+def chat(self, model, messages, streaming=True):
 """
 Public method to request a chat completion from the 'ollama' server.
 @param model name of the model to be used
 @type str
 @param messages list of message objects
 @type list of dict
-"""
+@param streaming flag indicating to receive a streaming response
-# TODO: not implemented yet
+@type bool
+"""
 ollamaRequest = {
 "model": model,
 "messages": messages,
+"stream": streaming,
 }
 self.__sendRequest(
 "chat", data=ollamaRequest, processResponse=self.__processChatResponse
 )
 @param response dictionary containing the chat response
 @type dict
 """
 with contextlib.suppress(KeyError):
 message = response["message"]
+done = response["done"]
 if message:
-self.replyReceived.emit(message["content"], message["role"])
+self.replyReceived.emit(message["content"], message["role"], done)
 def generate(self, model, prompt, suffix=None):
 """
 Public method to request to generate a completion from the 'ollama' server.
 @param prompt prompt to generate a response for
 @type str
 @param suffix text after the model response (defaults to None)
 @type str (optional)
 """
-# TODO: not implemented yet
 ollamaRequest = {
 "model": model,
 "prompt": prompt,
 }
 if suffix is not None:
 @param response dictionary containing the generate response
 @type dict
 """
 with contextlib.suppress(KeyError):
-self.replyReceived.emit(response["response"], "")
+self.replyReceived.emit(response["response"], "", response["done"])
 def pull(self, model):
 """
 Public method to ask the 'ollama' server to pull the given model.

Mercurial Repositories > ollama Interface / file comparison

comparison: OllamaInterface/OllamaClient.py

OllamaInterface/OllamaClient.py