mirror of https://github.com/vllm-project/vllm
35 lines
899 B
Python
35 lines
899 B
Python
# SPDX-License-Identifier: Apache-2.0
|
|
"""
|
|
Example of using the OpenAI entrypoint's rerank API which is compatible with
|
|
Jina and Cohere https://jina.ai/reranker
|
|
|
|
run: vllm serve BAAI/bge-reranker-base
|
|
"""
|
|
import json
|
|
|
|
import requests
|
|
|
|
# Rerank endpoint of the locally running server.
url = "http://127.0.0.1:8000/rerank"

# Send and accept JSON.
headers = {"accept": "application/json", "Content-Type": "application/json"}

# Request payload: the model name, the query, and the candidate documents.
data = {
    "model": "BAAI/bge-reranker-base",
    "query": "What is the capital of France?",
    "documents": [
        "The capital of Brazil is Brasilia.",
        "The capital of France is Paris.",
        "Horses and cows are both animals",
    ],
}

# requests applies no timeout by default, so without one this call could
# block forever if the server stops responding. Bound the wait (seconds);
# on expiry requests raises requests.exceptions.Timeout.
response = requests.post(url, headers=headers, json=data, timeout=60)

# Check the response
if response.status_code == 200:
    print("Request successful!")
    # Pretty-print the decoded JSON body.
    print(json.dumps(response.json(), indent=2))
else:
    print(f"Request failed with status code: {response.status_code}")
    # Show the raw body so the server's error message is visible.
    print(response.text)
|