Update Multimodal notebook
This commit is contained in:
parent
b30b9c338b
commit
598780fde8
1 changed file with 15 additions and 18 deletions
|
@ -1,5 +1,14 @@
|
||||||
{
|
{
|
||||||
"cells": [
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "markdown",
|
||||||
|
"metadata": {},
|
||||||
|
"source": [
|
||||||
|
"<div>\n",
|
||||||
|
" <img src=\"https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png\" width=\"500\"/>\n",
|
||||||
|
"</div>"
|
||||||
|
]
|
||||||
|
},
|
||||||
{
|
{
|
||||||
"cell_type": "code",
|
"cell_type": "code",
|
||||||
"execution_count": 1,
|
"execution_count": 1,
|
||||||
|
@ -9,19 +18,13 @@
|
||||||
"name": "stdout",
|
"name": "stdout",
|
||||||
"output_type": "stream",
|
"output_type": "stream",
|
||||||
"text": [
|
"text": [
|
||||||
"ChatCompletion(id='chatcmpl-65a710ba-41d1-4d0a-a124-a44b2b4a0189', choices=[Choice(finish_reason='stop', index=0, message=ChatCompletionMessage(content=' The image reads \"LlamaC++.\"', role='assistant', function_call=None, tool_calls=None))], created=1699413274, model='gpt-4-vision-preview', object='chat.completion', system_fingerprint=None, usage=CompletionUsage(completion_tokens=10, prompt_tokens=624, total_tokens=634))\n"
|
"{'text': 'Llama C++'}\n"
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"source": [
|
"source": [
|
||||||
"from openai import OpenAI\n",
|
"from openai import OpenAI\n",
|
||||||
"\n",
|
"\n",
|
||||||
"import urllib.request\n",
|
|
||||||
"import base64\n",
|
|
||||||
"\n",
|
|
||||||
"def get_data_url(url):\n",
|
|
||||||
" return \"data:image/png;base64,\" + base64.b64encode(urllib.request.urlopen(url).read()).decode(\"utf-8\")\n",
|
|
||||||
"\n",
|
|
||||||
"client = OpenAI(base_url=\"http://100.64.159.73:8000/v1\", api_key=\"sk-1234\")\n",
|
"client = OpenAI(base_url=\"http://100.64.159.73:8000/v1\", api_key=\"sk-1234\")\n",
|
||||||
"response = client.chat.completions.create(\n",
|
"response = client.chat.completions.create(\n",
|
||||||
" model=\"gpt-4-vision-preview\",\n",
|
" model=\"gpt-4-vision-preview\",\n",
|
||||||
|
@ -32,23 +35,17 @@
|
||||||
" {\n",
|
" {\n",
|
||||||
" \"type\": \"image_url\",\n",
|
" \"type\": \"image_url\",\n",
|
||||||
" \"image_url\": {\n",
|
" \"image_url\": {\n",
|
||||||
" \"url\": get_data_url(\"https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png\"),\n",
|
" \"url\": \"https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png\",\n",
|
||||||
" # \"url\": \"https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png\",\n",
|
|
||||||
" },\n",
|
" },\n",
|
||||||
" },\n",
|
" },\n",
|
||||||
" {\"type\": \"text\", \"text\": \"What does the image say\"},\n",
|
" {\"type\": \"text\", \"text\": \"What does the image say. Format your response as a json object with a single 'text' key.\"},\n",
|
||||||
" ],\n",
|
" ],\n",
|
||||||
" }\n",
|
" }\n",
|
||||||
" ],\n",
|
" ],\n",
|
||||||
|
" response_format={ \"type\": \"json_object\" }\n",
|
||||||
")\n",
|
")\n",
|
||||||
"print(response)"
|
"import json\n",
|
||||||
]
|
"print(json.loads(response.choices[0].message.content))"
|
||||||
},
|
|
||||||
{
|
|
||||||
"cell_type": "markdown",
|
|
||||||
"metadata": {},
|
|
||||||
"source": [
|
|
||||||
"![](https://user-images.githubusercontent.com/1991296/230134379-7181e485-c521-4d23-a0d6-f7b3b61ba524.png)"
|
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
|
|
Loading…
Reference in a new issue