consistency between generate and add naming

2023-06-29 18:22:45 -04:00 · 2023-06-29 18:22:45 -04:00 · 01c31aac78
commit 01c31aac78
parent 8fc8a00752
3 changed files with 38 additions and 30 deletions
--- a/ollama/cmd/cli.py
+++ b/ollama/cmd/cli.py
@@ -79,14 +79,18 @@ def generate_oneshot(*args, **kwargs):
    spinner = yaspin()
    spinner.start()
    spinner_running = True
-    for output in engine.generate(*args, **kwargs):
-        choices = output.get("choices", [])
-        if len(choices) > 0:
-            if spinner_running:
-                spinner.stop()
-                spinner_running = False
-                print("\r", end="")  # move cursor back to beginning of line again
-            print(choices[0].get("text", ""), end="", flush=True)
+    try:
+        for output in engine.generate(*args, **kwargs):
+            choices = output.get("choices", [])
+            if len(choices) > 0:
+                if spinner_running:
+                    spinner.stop()
+                    spinner_running = False
+                    print("\r", end="")  # move cursor back to beginning of line again
+                print(choices[0].get("text", ""), end="", flush=True)
+    except Exception:
+        spinner.stop()
+        raise

    # end with a new line
    print(flush=True)
--- a/ollama/engine.py
+++ b/ollama/engine.py
@@ -1,5 +1,4 @@
-import os
-import json
+from os import path, dup, dup2, devnull
 import sys
 from contextlib import contextmanager
 from llama_cpp import Llama as LLM
@@ -10,12 +9,12 @@ import ollama.prompt

@contextmanager
 def suppress_stderr():
-    stderr = os.dup(sys.stderr.fileno())
-    with open(os.devnull, "w") as devnull:
-        os.dup2(devnull.fileno(), sys.stderr.fileno())
+    stderr = dup(sys.stderr.fileno())
+    with open(devnull, "w") as null_file:  # do not rebind `devnull`: an `as devnull` target makes the name function-local, so open(devnull) raises UnboundLocalError
+        dup2(null_file.fileno(), sys.stderr.fileno())
        yield

-    os.dup2(stderr, sys.stderr.fileno())
+    dup2(stderr, sys.stderr.fileno())


 def generate(model, prompt, models_home=".", llms={}, *args, **kwargs):
@@ -38,12 +37,15 @@ def generate(model, prompt, models_home=".", llms={}, *args, **kwargs):
 def load(model, models_home=".", llms={}):
    llm = llms.get(model, None)
    if not llm:
-        stored_model_path = os.path.join(models_home, model, ".bin")
-        if os.path.exists(stored_model_path):
+        stored_model_path = path.join(models_home, model) + ".bin"
+        if path.exists(stored_model_path):
            model_path = stored_model_path
        else:
            # try loading this as a path to a model, rather than a model name
-            model_path = os.path.abspath(model)
+            model_path = path.abspath(model)
+
+        if not path.exists(model_path):
+            raise Exception(f"Model not found: {model}")

        try:
            # suppress LLM's output
--- a/ollama/model.py
+++ b/ollama/model.py
@@ -1,6 +1,6 @@
-import os
 import requests
 import validators
+from os import path, walk
 from urllib.parse import urlsplit, urlunsplit
 from tqdm import tqdm

@@ -9,9 +9,9 @@ models_endpoint_url = 'https://ollama.ai/api/models'


 def models(models_home='.', *args, **kwargs):
-    for _, _, files in os.walk(models_home):
+    for _, _, files in walk(models_home):
        for file in files:
-            base, ext = os.path.splitext(file)
+            base, ext = path.splitext(file)
            if ext == '.bin':
                yield base

@@ -27,7 +27,7 @@ def get_url_from_directory(model):
    return model


-def download_from_repo(url, models_home='.'):
+def download_from_repo(url, file_name, models_home='.'):
    parts = urlsplit(url)
    path_parts = parts.path.split('/tree/')

@@ -38,6 +38,8 @@ def download_from_repo(url, models_home='.'):
        location, branch = path_parts

    location = location.strip('/')
+    if file_name == '':
+        file_name = path.basename(location)

    download_url = urlunsplit(
        (
@@ -53,7 +55,7 @@ def download_from_repo(url, models_home='.'):
    json_response = response.json()

    download_url, file_size = find_bin_file(json_response, location, branch)
-    return download_file(download_url, models_home, location, file_size)
+    return download_file(download_url, models_home, file_name, file_size)


 def find_bin_file(json_response, location, branch):
@@ -73,17 +75,15 @@ def find_bin_file(json_response, location, branch):
    return download_url, file_size


-def download_file(download_url, models_home, location, file_size):
-    local_filename = os.path.join(models_home, os.path.basename(location)) + '.bin'
+def download_file(download_url, models_home, file_name, file_size):
+    local_filename = path.join(models_home, file_name) + '.bin'

-    first_byte = (
-        os.path.getsize(local_filename) if os.path.exists(local_filename) else 0
-    )
+    first_byte = path.getsize(local_filename) if path.exists(local_filename) else 0

    if first_byte >= file_size:
        return local_filename

-    print(f'Pulling {os.path.basename(location)}...')
+    print(f'Pulling {file_name}...')

    header = {'Range': f'bytes={first_byte}-'} if first_byte != 0 else {}

@@ -109,13 +109,15 @@ def download_file(download_url, models_home, location, file_size):


 def pull(model, models_home='.', *args, **kwargs):
-    if os.path.exists(model):
+    if path.exists(model):
        # a file on the filesystem is being specified
        return model
    # check the remote model location and see if it needs to be downloaded
    url = model
+    file_name = ""
    if not validators.url(url) and not url.startswith('huggingface.co'):
        url = get_url_from_directory(model)
+        file_name = model

    if not (url.startswith('http://') or url.startswith('https://')):
        url = f'https://{url}'
@@ -126,6 +128,6 @@ def pull(model, models_home='.', *args, **kwargs):
            return model
        raise Exception(f'Unknown model {model}')

-    local_filename = download_from_repo(url, models_home)
+    local_filename = download_from_repo(url, file_name, models_home)

    return local_filename