python/embed4all: use gguf model, allow passing kwargs/overriding model

Aaron Miller 2023-10-05 12:09:14 -07:00 committed by Adam Treat
parent 8bb6a6c201
commit a10f3aea5e


@@ -30,17 +30,14 @@ class Embed4All:
     """
     Python class that handles embeddings for GPT4All.
     """
-    def __init__(
-        self,
-        n_threads: Optional[int] = None,
-    ):
+    def __init__(self, model_name: Optional[str] = None, n_threads: Optional[int] = None, **kwargs):
         """
         Constructor

         Args:
             n_threads: number of CPU threads used by GPT4All. Default is None, then the number of threads are determined automatically.
         """
-        self.gpt4all = GPT4All(model_name='ggml-all-MiniLM-L6-v2-f16.bin', n_threads=n_threads)
+        self.gpt4all = GPT4All(model_name or 'ggml-all-MiniLM-L6-v2-f16.gguf', n_threads=n_threads, **kwargs)

     def embed(self, text: str) -> List[float]:
         """
@@ -315,7 +312,6 @@ class GPT4All:
         callback: pyllmodel.ResponseCallbackType,
         output_collector: List[MessageType],
     ) -> pyllmodel.ResponseCallbackType:
-
         def _callback(token_id: int, response: str) -> bool:
             nonlocal callback, output_collector
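For context, this second hunk is cosmetic (it removes a blank line), but the surrounding pattern is worth noting: the method wraps a user-supplied callback in a closure that accumulates generated text into output_collector before delegating the stop/continue decision back to the caller. A simplified, self-contained sketch of that closure pattern; the type aliases and the wrap_callback name are assumptions for illustration, not the bindings' actual API:

from typing import Any, Callable, Dict, List

MessageType = Dict[str, Any]                       # assumption: message dicts like {'role': ..., 'content': ...}
ResponseCallbackType = Callable[[int, str], bool]  # assumption: (token_id, response) -> keep generating?

def wrap_callback(
    callback: ResponseCallbackType,
    output_collector: List[MessageType],
) -> ResponseCallbackType:
    def _callback(token_id: int, response: str) -> bool:
        nonlocal callback, output_collector
        # Append each generated piece to the last collected message, then
        # defer to the user's callback to decide whether to keep generating.
        output_collector[-1]['content'] += response
        return callback(token_id, response)
    return _callback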