ollama/examples/python-simplegenerate/client.py

import json
import requests

# NOTE: ollama must be running for this to work, start the ollama app or run `ollama serve`
# Model name sent in the 'model' field of every request made by generate().
model = 'llama2' # TODO: update this for whatever model you wish to use

def generate(prompt, context):
    """Stream a completion for *prompt* from the local Ollama server.

    Posts to ``http://localhost:11434/api/generate`` using the module-level
    ``model`` and prints every ``response`` fragment to stdout as soon as it
    is received.

    Args:
        prompt: Text sent as the ``prompt`` field of the request.
        context: Value sent as the ``context`` field; pass the value returned
            by the previous call (or ``[]`` to start fresh).

    Returns:
        The ``context`` value of the final (``done``) message. If the stream
        ends without a ``done`` message, or that message carries no
        ``context``, the *context* argument is returned unchanged so the
        caller never ends up with ``None``.

    Raises:
        requests.HTTPError: If the server answers with an error status code.
        RuntimeError: If a streamed message contains an ``error`` field.
    """
    # Using the response as a context manager releases the connection even
    # when we return or raise in the middle of the stream.
    with requests.post(
        'http://localhost:11434/api/generate',
        json={
            'model': model,
            'prompt': prompt,
            'context': context,
        },
        stream=True,
    ) as r:
        r.raise_for_status()

        for line in r.iter_lines():
            # iter_lines() may yield empty keep-alive lines, which are not JSON.
            if not line:
                continue

            body = json.loads(line)

            # Surface server-side errors before printing anything from this message.
            if 'error' in body:
                raise RuntimeError(body['error'])

            # the response streams one token at a time, print that as we receive it
            print(body.get('response', ''), end='', flush=True)

            if body.get('done', False):
                return body.get('context', context)

    # Stream ended without a 'done' message: keep the caller's context intact.
    return context

def main():
    """Run an interactive prompt loop until the user ends the input.

    Each line typed by the user is passed to ``generate`` together with the
    context returned by the previous call. The loop stops cleanly when the
    user presses Ctrl-D (end of input) or Ctrl-C at the prompt.
    """
    context = []  # the context stores a conversation history, you can use this to make the model more context aware
    while True:
        try:
            user_input = input("Enter a prompt: ")
        except (EOFError, KeyboardInterrupt):
            # End of input or interrupt at the prompt: exit without a traceback.
            print()
            break
        print()
        context = generate(user_input, context)
        print()

# Start the interactive loop only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
python example 2023-08-14 18:27:13 +00:00			`import json`
			`import requests`

			# NOTE: ollama must be running for this to work, start the ollama app or run `ollama serve`
			`model = 'llama2' # TODO: update this for whatever model you wish to use`

update python example 2023-08-14 19:38:44 +00:00			`def generate(prompt, context):`
python example 2023-08-14 18:27:13 +00:00			`r = requests.post('http://localhost:11434/api/generate',`
			`json={`
			`'model': model,`
			`'prompt': prompt,`
			`'context': context,`
			`},`
			`stream=True)`
			`r.raise_for_status()`

			`for line in r.iter_lines():`
			`body = json.loads(line)`
			`response_part = body.get('response', '')`
Update client.py (#1026) recieve -> receive 2023-11-07 17:55:47 +00:00			`# the response streams one token at a time, print that as we receive it`
python example 2023-08-14 18:27:13 +00:00			`print(response_part, end='', flush=True)`

			`if 'error' in body:`
			`raise Exception(body['error'])`

			`if body.get('done', False):`
update python example 2023-08-14 19:38:44 +00:00			`return body['context']`
python example 2023-08-14 18:27:13 +00:00
			`def main():`
update python example 2023-08-14 19:38:44 +00:00			`context = [] # the context stores a conversation history, you can use this to make the model more context aware`
python example 2023-08-14 18:27:13 +00:00			`while True:`
			`user_input = input("Enter a prompt: ")`
			`print()`
update python example 2023-08-14 19:38:44 +00:00			`context = generate(user_input, context)`
python example 2023-08-14 18:27:13 +00:00			`print()`

			`if __name__ == "__main__":`
Update client.py (#1026) recieve -> receive 2023-11-07 17:55:47 +00:00			`main()`