gpt4all/gpt4all-bindings/cli/app.py

#!/usr/bin/env python3
"""GPT4All CLI

The GPT4All CLI is a self-contained script based on the `gpt4all` and `typer` packages. It offers a
REPL to communicate with a language model similar to the chat GUI application, but more basic.
"""

import importlib.metadata
import io
import sys
from collections import namedtuple
from typing_extensions import Annotated

import typer
from gpt4all import GPT4All


# Seed conversation shared by both REPL loops. It is a plain mutable list:
# the loops append every user/assistant turn to it and "/reset" empties it.
MESSAGES = [
    {"role": speaker, "content": text}
    for speaker, text in (
        ("system", "You are a helpful assistant."),
        ("user", "Hello there."),
        ("assistant", "Hi, how can I help you?"),
    )
]

def _cmd_reset(messages):
    """Forget the recorded conversation by emptying *messages* in place."""
    messages.clear()


def _cmd_exit(_messages):
    """Terminate the program via ``sys.exit()``."""
    sys.exit()


def _cmd_clear(_messages):
    """Push previous output out of view by printing a run of blank lines."""
    print("\n" * 100)


def _cmd_help(_messages):
    """Print the list of special commands."""
    print("Special commands: /reset, /exit, /help and /clear")


# Dispatch table for REPL input that starts a special command. Every handler
# takes the message history as its single positional argument (most ignore it).
SPECIAL_COMMANDS = {
    "/reset": _cmd_reset,
    "/exit": _cmd_exit,
    "/clear": _cmd_clear,
    "/help": _cmd_help,
}

# Version of this CLI script. VERSION_INFO is the source of truth (a tuple, so
# it can be compared programmatically); VERSION is its dotted string form.
VersionInfo = namedtuple('VersionInfo', 'major minor micro')
VERSION_INFO = VersionInfo(major=1, minor=0, micro=2)
VERSION = '.'.join(str(part) for part in VERSION_INFO)  # e.g. '1.2.3'

# Banner printed once by `repl` before the first prompt. It is an f-string so
# that VERSION is interpolated when the module is imported. The whitespace
# inside the literal (including trailing spaces) is part of the output.
CLI_START_MESSAGE = f"""
    
 ██████  ██████  ████████ ██   ██  █████  ██      ██      
██       ██   ██    ██    ██   ██ ██   ██ ██      ██      
██   ███ ██████     ██    ███████ ███████ ██      ██      
██    ██ ██         ██         ██ ██   ██ ██      ██      
 ██████  ██         ██         ██ ██   ██ ███████ ███████ 
                                                          

Welcome to the GPT4All CLI! Version {VERSION}
Type /help for special commands.
                                                    
"""

# Create the Typer application object. The functions decorated with
# @app.command() below (`repl` and `version`) are registered on it, and the
# __main__ guard at the bottom of the file invokes it.
app = typer.Typer()

@app.command()
def repl(
    model: Annotated[
        str,
        typer.Option("--model", "-m", help="Model to use for chatbot"),
    ] = "mistral-7b-instruct-v0.1.Q4_0.gguf",
    n_threads: Annotated[
        int,
        typer.Option("--n-threads", "-t", help="Number of threads to use for chatbot"),
    ] = None,
    device: Annotated[
        str,
        typer.Option("--device", "-d", help="Device to use for chatbot, e.g. gpu, amd, nvidia, intel. Defaults to CPU."),
    ] = None,
):
    """The CLI read-eval-print loop."""
    # NOTE: the docstring above is deliberately left unchanged because Typer
    # surfaces command docstrings as user-visible help text; implementation
    # notes therefore live in comments.
    #
    # Flow: load the model, optionally override its thread count, print the
    # banner, then hand over to the loop matching the installed bindings.
    gpt4all_instance = GPT4All(model, device=device)

    # if threads are passed, set them
    if n_threads is not None:
        # Report "before → after". The "after" value is read back from the
        # model rather than echoing the requested number.
        num_threads = gpt4all_instance.model.thread_count()
        print(f"\nAdjusted: {num_threads} →", end="")

        # set number of threads
        gpt4all_instance.model.set_thread_count(n_threads)

        num_threads = gpt4all_instance.model.thread_count()
        print(f" {num_threads} threads", end="", flush=True)
    else:
        print(f"\nUsing {gpt4all_instance.model.thread_count()} threads", end="")

    print(CLI_START_MESSAGE)

    # Pick the loop from the installed bindings' major version: >= 1 uses the
    # chat-session based loop, anything else the legacy one.
    use_new_loop = False
    try:
        # Named `bindings_version` so the module-level `version` command is
        # not shadowed inside this function.
        bindings_version = importlib.metadata.version('gpt4all')
        use_new_loop = int(bindings_version.split('.')[0]) >= 1
    except Exception:
        # Best effort: missing package metadata or an unparsable version
        # string falls back to the old loop. Catching `Exception` (instead of
        # a bare `except:`) lets KeyboardInterrupt/SystemExit propagate.
        pass
    if use_new_loop:
        _new_loop(gpt4all_instance)
    else:
        _old_loop(gpt4all_instance)


def _old_loop(gpt4all_instance):
    while True:
        message = input(" ⇢  ")

        # Check if special command and take action
        if message in SPECIAL_COMMANDS:
            SPECIAL_COMMANDS[message](MESSAGES)
            continue

        # if regular message, append to messages
        MESSAGES.append({"role": "user", "content": message})

        # execute chat completion and ignore the full response since 
        # we are outputting it incrementally
        full_response = gpt4all_instance.chat_completion(
            MESSAGES,
            # preferential kwargs for chat ux
            logits_size=0,
            tokens_size=0,
            n_past=0,
            n_ctx=0,
            n_predict=200,
            top_k=40,
            top_p=0.9,
            temp=0.9,
            n_batch=9,
            repeat_penalty=1.1,
            repeat_last_n=64,
            context_erase=0.0,
            # required kwargs for cli ux (incremental response)
            verbose=False,
            streaming=True,
        )
        # record assistant's response to messages
        MESSAGES.append(full_response.get("choices")[0].get("message"))
        print() # newline before next prompt


def _new_loop(gpt4all_instance):
    with gpt4all_instance.chat_session():
        while True:
            message = input(" ⇢  ")

            # Check if special command and take action
            if message in SPECIAL_COMMANDS:
                SPECIAL_COMMANDS[message](MESSAGES)
                continue

            # if regular message, append to messages
            MESSAGES.append({"role": "user", "content": message})

            # execute chat completion and ignore the full response since 
            # we are outputting it incrementally
            response_generator = gpt4all_instance.generate(
                message,
                # preferential kwargs for chat ux
                max_tokens=200,
                temp=0.9,
                top_k=40,
                top_p=0.9,
                repeat_penalty=1.1,
                repeat_last_n=64,
                n_batch=9,
                # required kwargs for cli ux (incremental response)
                streaming=True,
            )
            response = io.StringIO()
            for token in response_generator:
                print(token, end='', flush=True)
                response.write(token)

            # record assistant's response to messages
            response_message = {'role': 'assistant', 'content': response.getvalue()}
            response.close()
            gpt4all_instance.current_chat_session.append(response_message)
            MESSAGES.append(response_message)
            print() # newline before next prompt


@app.command()
def version():
    """The CLI version command."""
    # The docstring is kept verbatim: Typer surfaces command docstrings as
    # user-visible help text.
    version_line = f"gpt4all-cli v{VERSION}"
    print(version_line)


# Script entry point: invoke the Typer app only when this file is executed
# directly, not when it is imported as a module.
if __name__ == "__main__":
    app()
make scripts executable (#1555) 2023-10-24 09:28:21 -04:00			`#!/usr/bin/env python3`
CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`"""GPT4All CLI`

			The GPT4All CLI is a self-contained script based on the `gpt4all` and `typer` packages. It offers a
			`REPL to communicate with a language model similar to the chat GUI application, but more basic.`
			`"""`

python: replace deprecated pkg_resources with importlib (#1505) 2023-10-12 13:35:27 -04:00			`import importlib.metadata`
Fix CLI to work with 1.x.y version of the Python bindings (#1120) * Fix CLI to work with 1.x.y version of the Python bindings (tentative) - Adapted to bindings API changes - Version selection based on package information - Does not currently work with 1.x.y however, as it's not fully implemented: "NotImplementedError: Streaming tokens in a chat session is not currently supported." * Adapt to the completed streaming API with session support * Bump CLI version to 1.0.2 2023-07-05 22:42:15 -04:00			`import io`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`import sys`
CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`from collections import namedtuple`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`from typing_extensions import Annotated`
python: replace deprecated pkg_resources with importlib (#1505) 2023-10-12 13:35:27 -04:00
			`import typer`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`from gpt4all import GPT4All`

CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`MESSAGES = [`
			`{"role": "system", "content": "You are a helpful assistant."},`
			`{"role": "user", "content": "Hello there."},`
			`{"role": "assistant", "content": "Hi, how can I help you?"},`
			`]`

			`SPECIAL_COMMANDS = {`
			`"/reset": lambda messages: messages.clear(),`
			`"/exit": lambda _: sys.exit(),`
			`"/clear": lambda _: print("\n" * 100),`
			`"/help": lambda _: print("Special commands: /reset, /exit, /help and /clear"),`
			`}`

CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`VersionInfo = namedtuple('VersionInfo', ['major', 'minor', 'micro'])`
Fix CLI to work with 1.x.y version of the Python bindings (#1120) * Fix CLI to work with 1.x.y version of the Python bindings (tentative) - Adapted to bindings API changes - Version selection based on package information - Does not currently work with 1.x.y however, as it's not fully implemented: "NotImplementedError: Streaming tokens in a chat session is not currently supported." * Adapt to the completed streaming API with session support * Bump CLI version to 1.0.2 2023-07-05 22:42:15 -04:00			`VERSION_INFO = VersionInfo(1, 0, 2)`
CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`VERSION = '.'.join(map(str, VERSION_INFO)) # convert to string form, like: '1.2.3'`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00
			`CLI_START_MESSAGE = f"""`

			`██████ ██████ ████████ ██ ██ █████ ██ ██`
			`██ ██ ██ ██ ██ ██ ██ ██ ██ ██`
			`██ ███ ██████ ██ ███████ ███████ ██ ██`
			`██ ██ ██ ██ ██ ██ ██ ██ ██`
			`██████ ██ ██ ██ ██ ██ ███████ ███████`


			`Welcome to the GPT4All CLI! Version {VERSION}`
			`Type /help for special commands.`

			`"""`

			`# create typer app`
			`app = typer.Typer()`

			`@app.command()`
			`def repl(`
			`model: Annotated[`
			`str,`
			`typer.Option("--model", "-m", help="Model to use for chatbot"),`
app.py: change default model to Mistral Instruct (#1564) 2023-10-24 12:43:30 -04:00			`] = "mistral-7b-instruct-v0.1.Q4_0.gguf",`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`n_threads: Annotated[`
			`int,`
			`typer.Option("--n-threads", "-t", help="Number of threads to use for chatbot"),`
Do not ignore explicitly passed 4 threads 2023-05-25 11:53:39 -04:00			`] = None,`
app.py: add --device option for GPU support (#1769) Signed-off-by: Daniel Salvatierra <dsalvat1@gmail.com> Co-authored-by: Jared Van Bortel <jared@nomic.ai> 2023-12-20 16:01:03 -05:00			`device: Annotated[`
			`str,`
			`typer.Option("--device", "-d", help="Device to use for chatbot, e.g. gpu, amd, nvidia, intel. Defaults to CPU."),`
			`] = None,`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`):`
CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`"""The CLI read-eval-print loop."""`
app.py: add --device option for GPU support (#1769) Signed-off-by: Daniel Salvatierra <dsalvat1@gmail.com> Co-authored-by: Jared Van Bortel <jared@nomic.ai> 2023-12-20 16:01:03 -05:00			`gpt4all_instance = GPT4All(model, device=device)`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00
			`# if threads are passed, set them`
Do not ignore explicitly passed 4 threads 2023-05-25 11:53:39 -04:00			`if n_threads is not None:`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`num_threads = gpt4all_instance.model.thread_count()`
			`print(f"\nAdjusted: {num_threads} →", end="")`

			`# set number of threads`
			`gpt4all_instance.model.set_thread_count(n_threads)`

			`num_threads = gpt4all_instance.model.thread_count()`
			`print(f" {num_threads} threads", end="", flush=True)`
Do not ignore explicitly passed 4 threads 2023-05-25 11:53:39 -04:00			`else:`
			`print(f"\nUsing {gpt4all_instance.model.thread_count()} threads", end="")`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00
			`print(CLI_START_MESSAGE)`

Fix CLI to work with 1.x.y version of the Python bindings (#1120) * Fix CLI to work with 1.x.y version of the Python bindings (tentative) - Adapted to bindings API changes - Version selection based on package information - Does not currently work with 1.x.y however, as it's not fully implemented: "NotImplementedError: Streaming tokens in a chat session is not currently supported." * Adapt to the completed streaming API with session support * Bump CLI version to 1.0.2 2023-07-05 22:42:15 -04:00			`use_new_loop = False`
			`try:`
python: replace deprecated pkg_resources with importlib (#1505) 2023-10-12 13:35:27 -04:00			`version = importlib.metadata.version('gpt4all')`
Fix CLI to work with 1.x.y version of the Python bindings (#1120) * Fix CLI to work with 1.x.y version of the Python bindings (tentative) - Adapted to bindings API changes - Version selection based on package information - Does not currently work with 1.x.y however, as it's not fully implemented: "NotImplementedError: Streaming tokens in a chat session is not currently supported." * Adapt to the completed streaming API with session support * Bump CLI version to 1.0.2 2023-07-05 22:42:15 -04:00			`version_major = int(version.split('.')[0])`
			`if version_major >= 1:`
			`use_new_loop = True`
			`except:`
			`pass # fall back to old loop`
			`if use_new_loop:`
			`_new_loop(gpt4all_instance)`
			`else:`
			`_old_loop(gpt4all_instance)`


			`def _old_loop(gpt4all_instance):`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`while True:`
			`message = input(" ⇢ ")`

			`# Check if special command and take action`
			`if message in SPECIAL_COMMANDS:`
			`SPECIAL_COMMANDS[message](MESSAGES)`
			`continue`

			`# if regular message, append to messages`
			`MESSAGES.append({"role": "user", "content": message})`

			`# execute chat completion and ignore the full response since`
			`# we are outputting it incrementally`
			`full_response = gpt4all_instance.chat_completion(`
			`MESSAGES,`
			`# preferential kwargs for chat ux`
			`logits_size=0,`
			`tokens_size=0,`
			`n_past=0,`
			`n_ctx=0,`
			`n_predict=200,`
			`top_k=40,`
			`top_p=0.9,`
			`temp=0.9,`
			`n_batch=9,`
			`repeat_penalty=1.1,`
			`repeat_last_n=64,`
			`context_erase=0.0,`
			`# required kwargs for cli ux (incremental response)`
			`verbose=False,`
Fix CLI app.py (#910) - the bindings API changed in 057b9, but the CLI was not updated - change 'std_passthrough' param to the renamed 'streaming' - remove '_cli_override_response_callback' as it breaks and is no longer needed - bump version to 0.3.4 2023-06-16 16:06:22 -04:00			`streaming=True,`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`)`
			`# record assistant's response to messages`
			`MESSAGES.append(full_response.get("choices")[0].get("message"))`
			`print() # newline before next prompt`


Fix CLI to work with 1.x.y version of the Python bindings (#1120) * Fix CLI to work with 1.x.y version of the Python bindings (tentative) - Adapted to bindings API changes - Version selection based on package information - Does not currently work with 1.x.y however, as it's not fully implemented: "NotImplementedError: Streaming tokens in a chat session is not currently supported." * Adapt to the completed streaming API with session support * Bump CLI version to 1.0.2 2023-07-05 22:42:15 -04:00			`def _new_loop(gpt4all_instance):`
			`with gpt4all_instance.chat_session():`
			`while True:`
			`message = input(" ⇢ ")`

			`# Check if special command and take action`
			`if message in SPECIAL_COMMANDS:`
			`SPECIAL_COMMANDS[message](MESSAGES)`
			`continue`

			`# if regular message, append to messages`
			`MESSAGES.append({"role": "user", "content": message})`

			`# execute chat completion and ignore the full response since`
			`# we are outputting it incrementally`
			`response_generator = gpt4all_instance.generate(`
			`message,`
			`# preferential kwargs for chat ux`
			`max_tokens=200,`
			`temp=0.9,`
			`top_k=40,`
			`top_p=0.9,`
			`repeat_penalty=1.1,`
			`repeat_last_n=64,`
			`n_batch=9,`
			`# required kwargs for cli ux (incremental response)`
			`streaming=True,`
			`)`
			`response = io.StringIO()`
			`for token in response_generator:`
			`print(token, end='', flush=True)`
			`response.write(token)`

			`# record assistant's response to messages`
			`response_message = {'role': 'assistant', 'content': response.getvalue()}`
			`response.close()`
			`gpt4all_instance.current_chat_session.append(response_message)`
			`MESSAGES.append(response_message)`
			`print() # newline before next prompt`


adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00			`@app.command()`
			`def version():`
CLI Improvements (#1021) * Add gpt4all-bindings/cli/README.md * Unify version information - Was previously split; base one on the other - Add VERSION_INFO as the "source of truth": - Modelled after sys.version_info. - Implemented as a tuple, because it's much easier for (partial) programmatic comparison. - Previous API is kept intact. * Add gpt4all-bindings/cli/developer_notes.md - A few notes on what's what, especially regarding docs * Add gpt4all-bindings/python/docs/gpt4all_cli.md - The CLI user documentation * Bump CLI version to 0.3.5 * Finalise docs & add to index.md - Amend where necessary - Fix typo in gpt4all_cli.md - Mention and add link to CLI doc in index.md * Add docstings to gpt4all-bindings/cli/app.py * Better 'groovy' link & fix typo - Documentation: point to the Hugging Face model card for 'groovy' - Correct typo in app.py 2023-06-23 15:09:31 -04:00			`"""The CLI version command."""`
			`print(f"gpt4all-cli v{VERSION}")`
adds a simple cli chat repl (#566) * adds a simple cli chat repl * add n thread support and append assistant response 2023-05-16 16:47:54 -04:00

			`if __name__ == "__main__":`
			`app()`