~ | support local llm inference

2024-03-11 18:31:13 +00:00 · 2024-03-11 18:31:13 +00:00 · 479ef89f4c
parent b7342b1f13
commit 479ef89f4c
1 changed file with 5 additions and 68 deletions
--- a/g4f/local/__init__.py
+++ b/g4f/local/__init__.py
@@ -1,75 +1,13 @@
-import random, string, time, re
-
 from ..typing import Union, Iterator, Messages
 from ..stubs  import ChatCompletion, ChatCompletionChunk
 from .core.engine import LocalProvider
 from .core.models import models
-
-IterResponse = Iterator[Union[ChatCompletion, ChatCompletionChunk]]
-
-def read_json(text: str) -> dict:
-    match = re.search(r"```(json|)\n(?P<code>[\S\s]+?)\n```", text)
-    if match:
-        return match.group("code")
-    return text
-
-def iter_response(
-    response: Iterator[str],
-    stream: bool,
-    response_format: dict = None,
-    max_tokens: int = None,
-    stop: list = None
-) -> IterResponse:
-    
-    content = ""
-    finish_reason = None
-    completion_id = ''.join(random.choices(string.ascii_letters + string.digits, k=28))
-    for idx, chunk in enumerate(response):
-        content += str(chunk)
-        if max_tokens is not None and idx + 1 >= max_tokens:
-            finish_reason = "length"
-        first = -1
-        word = None
-        if stop is not None:
-            for word in list(stop):
-                first = content.find(word)
-                if first != -1:
-                    content = content[:first]
-                    break
-            if stream and first != -1:
-                first = chunk.find(word)
-                if first != -1:
-                    chunk = chunk[:first]
-                else:
-                    first = 0
-        if first != -1:
-            finish_reason = "stop"
-        if stream:
-            yield ChatCompletionChunk(chunk, None, completion_id, int(time.time()))
-        if finish_reason is not None:
-            break
-    finish_reason = "stop" if finish_reason is None else finish_reason
-    if stream:
-        yield ChatCompletionChunk(None, finish_reason, completion_id, int(time.time()))
-    else:
-        if response_format is not None and "type" in response_format:
-            if response_format["type"] == "json_object":
-                content = read_json(content)
-        yield ChatCompletion(content, finish_reason, completion_id, int(time.time()))
-
-def filter_none(**kwargs):
-    for key in list(kwargs.keys()):
-        if kwargs[key] is None:
-            del kwargs[key]
-    return kwargs
+from ..client     import iter_response, filter_none, IterResponse

 class LocalClient():
-    def __init__(
-        self,
-        **kwargs
-    ) -> None:
+    def __init__(self, **kwargs) -> None:
        self.chat: Chat = Chat(self)
-        
+    
    @staticmethod
    def list_models():
        return list(models.keys())
@@ -100,10 +38,9 @@ class Completions():
        )
        response = iter_response(response, stream, response_format, max_tokens, stop)
        return response if stream else next(response)
-    
+
 class Chat():
    completions: Completions

    def __init__(self, client: LocalClient):
-        self.completions = Completions(client)
-    
+        self.completions = Completions(client)