Feat/sdk vision support (#1531)

Co-authored-by: Joel <iamjoel007@gmail.com>
This commit is contained in:
Garfield Dai 2023-11-20 17:54:01 +08:00 committed by GitHub
parent ac3496e681
commit 5b7071e4b0
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
11 changed files with 319 additions and 62 deletions

View File

@ -26,6 +26,9 @@ class FileApi(AppApiResource):
if 'file' not in request.files: if 'file' not in request.files:
raise NoFileUploadedError() raise NoFileUploadedError()
if not file.mimetype:
raise UnsupportedFileTypeError()
if len(request.files) > 1: if len(request.files) > 1:
raise TooManyFilesError() raise TooManyFilesError()

View File

@ -14,27 +14,33 @@ import { DifyClient, ChatClient, CompletionClient } from 'dify-client'
const API_KEY = 'your-api-key-here' const API_KEY = 'your-api-key-here'
const user = `random-user-id` const user = `random-user-id`
const inputs = { const query = 'Please tell me a short story in 10 words or less.'
name: 'test name a' const remote_url_files = [{
} type: 'image',
const query = "Please tell me a short story in 10 words or less." transfer_method: 'remote_url',
url: 'your_url_addresss'
}]
// Create a completion client // Create a completion client
const completionClient = new CompletionClient(API_KEY) const completionClient = new CompletionClient(API_KEY)
// Create a completion message // Create a completion message
completionClient.createCompletionMessage(inputs, query, responseMode, user) completionClient.createCompletionMessage({'query': query}, user)
// Create a completion message with vision model
completionClient.createCompletionMessage({'query': 'Describe the picture.'}, user, false, remote_url_files)
// Create a chat client // Create a chat client
const chatClient = new ChatClient(API_KEY) const chatClient = new ChatClient(API_KEY)
// Create a chat message in stream mode // Create a chat message in stream mode
const response = await chatClient.createChatMessage(inputs, query, user, true, null) const response = await chatClient.createChatMessage({}, query, user, true, null)
const stream = response.data; const stream = response.data;
stream.on('data', data => { stream.on('data', data => {
console.log(data); console.log(data);
}); });
stream.on('end', () => { stream.on('end', () => {
console.log("stream done"); console.log('stream done');
}); });
// Create a chat message with vision model
chatClient.createChatMessage({}, 'Describe the picture.', user, false, null, remote_url_files)
// Fetch conversations // Fetch conversations
chatClient.getConversations(user) chatClient.getConversations(user)
// Fetch conversation messages // Fetch conversation messages

View File

@ -34,6 +34,10 @@ export const routes = {
method: "DELETE", method: "DELETE",
url: (conversation_id) => `/conversations/${conversation_id}`, url: (conversation_id) => `/conversations/${conversation_id}`,
}, },
fileUpload: {
method: "POST",
url: () => `/files/upload`,
}
}; };
export class DifyClient { export class DifyClient {
@ -51,11 +55,15 @@ export class DifyClient {
endpoint, endpoint,
data = null, data = null,
params = null, params = null,
stream = false stream = false,
headerParams = {}
) { ) {
const headers = { const headers = {
Authorization: `Bearer ${this.apiKey}`, ...{
"Content-Type": "application/json", Authorization: `Bearer ${this.apiKey}`,
"Content-Type": "application/json",
},
...headerParams
}; };
const url = `${this.baseUrl}${endpoint}`; const url = `${this.baseUrl}${endpoint}`;
@ -104,15 +112,28 @@ export class DifyClient {
params params
); );
} }
fileUpload(data) {
return this.sendRequest(
routes.fileUpload.method,
routes.fileUpload.url(),
data,
null,
false,
{
"Content-Type": 'multipart/form-data'
}
);
}
} }
export class CompletionClient extends DifyClient { export class CompletionClient extends DifyClient {
createCompletionMessage(inputs, query, user, stream = false) { createCompletionMessage(inputs, user, stream = false, files = null) {
const data = { const data = {
inputs, inputs,
query,
user, user,
response_mode: stream ? "streaming" : "blocking", response_mode: stream ? "streaming" : "blocking",
files,
}; };
return this.sendRequest( return this.sendRequest(
routes.createCompletionMessage.method, routes.createCompletionMessage.method,
@ -130,13 +151,15 @@ export class ChatClient extends DifyClient {
query, query,
user, user,
stream = false, stream = false,
conversation_id = null conversation_id = null,
files = null
) { ) {
const data = { const data = {
inputs, inputs,
query, query,
user, user,
response_mode: stream ? "streaming" : "blocking", response_mode: stream ? "streaming" : "blocking",
files,
}; };
if (conversation_id) data.conversation_id = conversation_id; if (conversation_id) data.conversation_id = conversation_id;

View File

@ -1,6 +1,6 @@
{ {
"name": "dify-client", "name": "dify-client",
"version": "2.0.0", "version": "2.1.0",
"description": "This is the Node.js SDK for the Dify.AI API, which allows you to easily integrate Dify.AI into your Node.js applications.", "description": "This is the Node.js SDK for the Dify.AI API, which allows you to easily integrate Dify.AI into your Node.js applications.",
"main": "index.js", "main": "index.js",
"type": "module", "type": "module",

View File

@ -11,7 +11,7 @@ This is the PHP SDK for the Dify API, which allows you to easily integrate Dify
After installing the SDK, you can use it in your project like this: After installing the SDK, you can use it in your project like this:
``` ```php
<?php <?php
require 'vendor/autoload.php'; require 'vendor/autoload.php';
@ -26,17 +26,50 @@ $difyClient = new DifyClient($apiKey);
// Create a completion client // Create a completion client
$completionClient = new CompletionClient($apiKey); $completionClient = new CompletionClient($apiKey);
$response = $completionClient->create_completion_message($inputs, $query, $response_mode, $user); $response = $completionClient->create_completion_message(array("query" => "Who are you?"), "blocking", "user_id");
// Create a chat client // Create a chat client
$chatClient = new ChatClient($apiKey); $chatClient = new ChatClient($apiKey);
$response = $chatClient->create_chat_message($inputs, $query, $user, $response_mode, $conversation_id); $response = $chatClient->create_chat_message(array(), "Who are you?", "user_id", "blocking", $conversation_id);
$fileForVision = [
[
"type" => "image",
"transfer_method" => "remote_url",
"url" => "your_image_url"
]
];
// $fileForVision = [
// [
// "type" => "image",
// "transfer_method" => "local_file",
// "url" => "your_file_id"
// ]
// ];
// Create a completion client with vision model like gpt-4-vision
$response = $completionClient->create_completion_message(array("query" => "Describe this image."), "blocking", "user_id", $fileForVision);
// Create a chat client with vision model like gpt-4-vision
$response = $chatClient->create_chat_message(array(), "Describe this image.", "user_id", "blocking", $conversation_id, $fileForVision);
// File Upload
$fileForUpload = [
[
'tmp_name' => '/path/to/file/filename.jpg',
'name' => 'filename.jpg'
]
];
$response = $difyClient->file_upload("user_id", $fileForUpload);
$result = json_decode($response->getBody(), true);
echo 'upload_file_id: ' . $result['id'];
// Fetch application parameters // Fetch application parameters
$response = $difyClient->get_application_parameters($user); $response = $difyClient->get_application_parameters("user_id");
// Provide feedback for a message // Provide feedback for a message
$response = $difyClient->message_feedback($message_id, $rating, $user); $response = $difyClient->message_feedback($message_id, $rating, "user_id");
// Other available methods: // Other available methods:
// - get_conversation_messages() // - get_conversation_messages()

View File

@ -19,6 +19,13 @@ class DifyClient {
'Content-Type' => 'application/json', 'Content-Type' => 'application/json',
], ],
]); ]);
$this->file_client = new Client([
'base_uri' => $this->base_url,
'headers' => [
'Authorization' => 'Bearer ' . $this->api_key,
'Content-Type' => 'multipart/form-data',
],
]);
} }
protected function send_request($method, $endpoint, $data = null, $params = null, $stream = false) { protected function send_request($method, $endpoint, $data = null, $params = null, $stream = false) {
@ -44,27 +51,57 @@ class DifyClient {
$params = ['user' => $user]; $params = ['user' => $user];
return $this->send_request('GET', 'parameters', null, $params); return $this->send_request('GET', 'parameters', null, $params);
} }
public function file_upload($user, $files) {
$data = ['user' => $user];
$options = [
'multipart' => $this->prepareMultipart($data, $files)
];
return $this->file_client->request('POST', 'files/upload', $options);
}
protected function prepareMultipart($data, $files) {
$multipart = [];
foreach ($data as $key => $value) {
$multipart[] = [
'name' => $key,
'contents' => $value
];
}
foreach ($files as $file) {
$multipart[] = [
'name' => 'file',
'contents' => fopen($file['tmp_name'], 'r'),
'filename' => $file['name']
];
}
return $multipart;
}
} }
class CompletionClient extends DifyClient { class CompletionClient extends DifyClient {
public function create_completion_message($inputs, $query, $response_mode, $user) { public function create_completion_message($inputs, $response_mode, $user, $files = null) {
$data = [ $data = [
'inputs' => $inputs, 'inputs' => $inputs,
'query' => $query,
'response_mode' => $response_mode, 'response_mode' => $response_mode,
'user' => $user, 'user' => $user,
'files' => $files,
]; ];
return $this->send_request('POST', 'completion-messages', $data, null, $response_mode === 'streaming'); return $this->send_request('POST', 'completion-messages', $data, null, $response_mode === 'streaming');
} }
} }
class ChatClient extends DifyClient { class ChatClient extends DifyClient {
public function create_chat_message($inputs, $query, $user, $response_mode = 'blocking', $conversation_id = null) { public function create_chat_message($inputs, $query, $user, $response_mode = 'blocking', $conversation_id = null, $files = null) {
$data = [ $data = [
'inputs' => $inputs, 'inputs' => $inputs,
'query' => $query, 'query' => $query,
'user' => $user, 'user' => $user,
'response_mode' => $response_mode, 'response_mode' => $response_mode,
'files' => $files,
]; ];
if ($conversation_id) { if ($conversation_id) {
$data['conversation_id'] = $conversation_id; $data['conversation_id'] = $conversation_id;

View File

@ -14,8 +14,7 @@ Write your code with sdk:
- completion generate with `blocking` response_mode - completion generate with `blocking` response_mode
``` ```python
import json
from dify_client import CompletionClient from dify_client import CompletionClient
api_key = "your_api_key" api_key = "your_api_key"
@ -24,18 +23,50 @@ api_key = "your_api_key"
completion_client = CompletionClient(api_key) completion_client = CompletionClient(api_key)
# Create Completion Message using CompletionClient # Create Completion Message using CompletionClient
completion_response = completion_client.create_completion_message(inputs={}, query="Hello", response_mode="blocking", user="user_id") completion_response = completion_client.create_completion_message(inputs={"query": "What's the weather like today?"},
response_mode="blocking", user="user_id")
completion_response.raise_for_status() completion_response.raise_for_status()
result = completion_response.text result = completion_response.json()
result = json.loads(result)
print(result.get('answer'))
```
- completion using vision model, like gpt-4-vision
```python
from dify_client import CompletionClient
api_key = "your_api_key"
# Initialize CompletionClient
completion_client = CompletionClient(api_key)
files = [{
"type": "image",
"transfer_method": "remote_url",
"url": "your_image_url"
}]
# files = [{
# "type": "image",
# "transfer_method": "local_file",
# "upload_file_id": "your_file_id"
# }]
# Create Completion Message using CompletionClient
completion_response = completion_client.create_completion_message(inputs={"query": "Describe the picture."},
response_mode="blocking", user="user_id", files=files)
completion_response.raise_for_status()
result = completion_response.json()
print(result.get('answer')) print(result.get('answer'))
``` ```
- chat generate with `streaming` response_mode - chat generate with `streaming` response_mode
``` ```python
import json import json
from dify_client import ChatClient from dify_client import ChatClient
@ -55,10 +86,67 @@ for line in chat_response.iter_lines(decode_unicode=True):
print(line.get('answer')) print(line.get('answer'))
``` ```
- chat using vision model, like gpt-4-vision
```python
from dify_client import ChatClient
api_key = "your_api_key"
# Initialize ChatClient
chat_client = ChatClient(api_key)
files = [{
"type": "image",
"transfer_method": "remote_url",
"url": "your_image_url"
}]
# files = [{
# "type": "image",
# "transfer_method": "local_file",
# "upload_file_id": "your_file_id"
# }]
# Create Chat Message using ChatClient
chat_response = chat_client.create_chat_message(inputs={}, query="Describe the picture.", user="user_id",
response_mode="blocking", files=files)
chat_response.raise_for_status()
result = chat_response.json()
print(result.get("answer"))
```
- upload file when using vision model
```python
from dify_client import DifyClient
api_key = "your_api_key"
# Initialize Client
dify_client = DifyClient(api_key)
file_path = "your_image_file_path"
file_name = "panda.jpeg"
mime_type = "image/jpeg"
with open(file_path, "rb") as file:
files = {
"file": (file_name, file, mime_type)
}
response = dify_client.file_upload("user_id", files)
result = response.json()
print(f'upload_file_id: {result.get("id")}')
```
- Others - Others
``` ```python
import json
from dify_client import ChatClient from dify_client import ChatClient
api_key = "your_api_key" api_key = "your_api_key"
@ -69,32 +157,29 @@ client = ChatClient(api_key)
# Get App parameters # Get App parameters
parameters = client.get_application_parameters(user="user_id") parameters = client.get_application_parameters(user="user_id")
parameters.raise_for_status() parameters.raise_for_status()
parameters = json.loads(parameters.text)
print('[parameters]') print('[parameters]')
print(parameters) print(parameters.json())
# Get Conversation List (only for chat) # Get Conversation List (only for chat)
conversations = client.get_conversations(user="user_id") conversations = client.get_conversations(user="user_id")
conversations.raise_for_status() conversations.raise_for_status()
conversations = json.loads(conversations.text)
print('[conversations]') print('[conversations]')
print(conversations) print(conversations.json())
# Get Message List (only for chat) # Get Message List (only for chat)
messages = client.get_conversation_messages(user="user_id", conversation_id="conversation_id") messages = client.get_conversation_messages(user="user_id", conversation_id="conversation_id")
messages.raise_for_status() messages.raise_for_status()
messages = json.loads(messages.text)
print('[messages]') print('[messages]')
print(messages) print(messages.json())
# Rename Conversation (only for chat) # Rename Conversation (only for chat)
rename_conversation_response = client.rename_conversation(conversation_id="conversation_id", name="new_name", user="user_id") rename_conversation_response = client.rename_conversation(conversation_id="conversation_id",
name="new_name", user="user_id")
rename_conversation_response.raise_for_status() rename_conversation_response.raise_for_status()
rename_conversation_result = json.loads(rename_conversation_response.text)
print('[rename result]') print('[rename result]')
print(rename_conversation_result) print(rename_conversation_response.json())
``` ```

View File

@ -1 +1 @@
from dify_client.client import ChatClient, CompletionClient from dify_client.client import ChatClient, CompletionClient, DifyClient

View File

@ -6,14 +6,24 @@ class DifyClient:
self.api_key = api_key self.api_key = api_key
self.base_url = "https://api.dify.ai/v1" self.base_url = "https://api.dify.ai/v1"
def _send_request(self, method, endpoint, data=None, params=None, stream=False): def _send_request(self, method, endpoint, json=None, params=None, stream=False):
headers = { headers = {
"Authorization": f"Bearer {self.api_key}", "Authorization": f"Bearer {self.api_key}",
"Content-Type": "application/json" "Content-Type": "application/json"
} }
url = f"{self.base_url}{endpoint}" url = f"{self.base_url}{endpoint}"
response = requests.request(method, url, json=data, params=params, headers=headers, stream=stream) response = requests.request(method, url, json=json, params=params, headers=headers, stream=stream)
return response
def _send_request_with_files(self, method, endpoint, data, files):
headers = {
"Authorization": f"Bearer {self.api_key}"
}
url = f"{self.base_url}{endpoint}"
response = requests.request(method, url, data=data, headers=headers, files=files)
return response return response
@ -28,30 +38,39 @@ class DifyClient:
params = {"user": user} params = {"user": user}
return self._send_request("GET", "/parameters", params=params) return self._send_request("GET", "/parameters", params=params)
def file_upload(self, user, files):
class CompletionClient(DifyClient):
def create_completion_message(self, inputs, query, response_mode, user):
data = { data = {
"inputs": inputs,
"query": query,
"response_mode": response_mode,
"user": user "user": user
} }
return self._send_request("POST", "/completion-messages", data, stream=True if response_mode == "streaming" else False) return self._send_request_with_files("POST", "/files/upload", data=data, files=files)
class CompletionClient(DifyClient):
def create_completion_message(self, inputs, response_mode, user, files=None):
data = {
"inputs": inputs,
"response_mode": response_mode,
"user": user,
"files": files
}
return self._send_request("POST", "/completion-messages", data,
stream=True if response_mode == "streaming" else False)
class ChatClient(DifyClient): class ChatClient(DifyClient):
def create_chat_message(self, inputs, query, user, response_mode="blocking", conversation_id=None): def create_chat_message(self, inputs, query, user, response_mode="blocking", conversation_id=None, files=None):
data = { data = {
"inputs": inputs, "inputs": inputs,
"query": query, "query": query,
"user": user, "user": user,
"response_mode": response_mode "response_mode": response_mode,
"files": files
} }
if conversation_id: if conversation_id:
data["conversation_id"] = conversation_id data["conversation_id"] = conversation_id
return self._send_request("POST", "/chat-messages", data, stream=True if response_mode == "streaming" else False) return self._send_request("POST", "/chat-messages", data,
stream=True if response_mode == "streaming" else False)
def get_conversation_messages(self, user, conversation_id=None, first_id=None, limit=None): def get_conversation_messages(self, user, conversation_id=None, first_id=None, limit=None):
params = {"user": user} params = {"user": user}

View File

@ -5,7 +5,7 @@ with open("README.md", "r", encoding="utf-8") as fh:
setup( setup(
name="dify-client", name="dify-client",
version="0.1.8", version="0.1.10",
author="Dify", author="Dify",
author_email="hello@dify.ai", author_email="hello@dify.ai",
description="A package for interacting with the Dify Service-API", description="A package for interacting with the Dify Service-API",

View File

@ -12,15 +12,33 @@ class TestChatClient(unittest.TestCase):
def test_create_chat_message(self): def test_create_chat_message(self):
response = self.chat_client.create_chat_message({}, "Hello, World!", "test_user") response = self.chat_client.create_chat_message({}, "Hello, World!", "test_user")
self.assertIn("message_id", response) self.assertIn("answer", response.text)
def test_create_chat_message_with_vision_model_by_remote_url(self):
files = [{
"type": "image",
"transfer_method": "remote_url",
"url": "your_image_url"
}]
response = self.chat_client.create_chat_message({}, "Describe the picture.", "test_user", files=files)
self.assertIn("answer", response.text)
def test_create_chat_message_with_vision_model_by_local_file(self):
files = [{
"type": "image",
"transfer_method": "local_file",
"upload_file_id": "your_file_id"
}]
response = self.chat_client.create_chat_message({}, "Describe the picture.", "test_user", files=files)
self.assertIn("answer", response.text)
def test_get_conversation_messages(self): def test_get_conversation_messages(self):
response = self.chat_client.get_conversation_messages("test_user") response = self.chat_client.get_conversation_messages("test_user", "your_conversation_id")
self.assertIsInstance(response, list) self.assertIn("answer", response.text)
def test_get_conversations(self): def test_get_conversations(self):
response = self.chat_client.get_conversations("test_user") response = self.chat_client.get_conversations("test_user")
self.assertIsInstance(response, list) self.assertIn("data", response.text)
class TestCompletionClient(unittest.TestCase): class TestCompletionClient(unittest.TestCase):
@ -28,8 +46,29 @@ class TestCompletionClient(unittest.TestCase):
self.completion_client = CompletionClient(API_KEY) self.completion_client = CompletionClient(API_KEY)
def test_create_completion_message(self): def test_create_completion_message(self):
response = self.completion_client.create_completion_message({}, "What's the weather like today?", "blocking", "test_user") response = self.completion_client.create_completion_message({"query": "What's the weather like today?"},
self.assertIn("message_id", response) "blocking", "test_user")
self.assertIn("answer", response.text)
def test_create_completion_message_with_vision_model_by_remote_url(self):
files = [{
"type": "image",
"transfer_method": "remote_url",
"url": "your_image_url"
}]
response = self.completion_client.create_completion_message(
{"query": "Describe the picture."}, "blocking", "test_user", files)
self.assertIn("answer", response.text)
def test_create_completion_message_with_vision_model_by_local_file(self):
files = [{
"type": "image",
"transfer_method": "local_file",
"upload_file_id": "your_file_id"
}]
response = self.completion_client.create_completion_message(
{"query": "Describe the picture."}, "blocking", "test_user", files)
self.assertIn("answer", response.text)
class TestDifyClient(unittest.TestCase): class TestDifyClient(unittest.TestCase):
@ -37,12 +76,24 @@ class TestDifyClient(unittest.TestCase):
self.dify_client = DifyClient(API_KEY) self.dify_client = DifyClient(API_KEY)
def test_message_feedback(self): def test_message_feedback(self):
response = self.dify_client.message_feedback("test_message_id", 5, "test_user") response = self.dify_client.message_feedback("your_message_id", 'like', "test_user")
self.assertIn("success", response) self.assertIn("success", response.text)
def test_get_application_parameters(self): def test_get_application_parameters(self):
response = self.dify_client.get_application_parameters("test_user") response = self.dify_client.get_application_parameters("test_user")
self.assertIsInstance(response, dict) self.assertIn("user_input_form", response.text)
def test_file_upload(self):
file_path = "your_image_file_path"
file_name = "panda.jpeg"
mime_type = "image/jpeg"
with open(file_path, "rb") as file:
files = {
"file": (file_name, file, mime_type)
}
response = self.dify_client.file_upload("test_user", files)
self.assertIn("name", response.text)
if __name__ == "__main__": if __name__ == "__main__":