"""
Example of using the OpenAI entrypoint's rerank API, which is compatible with
the Jina and Cohere rerank APIs (https://jina.ai/reranker).

Start the server before running this script:

    vllm serve BAAI/bge-reranker-base
"""

import json

import requests

# Endpoint and payload for the rerank request. The model name must match the
# model passed to `vllm serve`.
url = "http://127.0.0.1:8000/rerank"
headers = {"accept": "application/json", "Content-Type": "application/json"}
data = {
    "model": "BAAI/bge-reranker-base",
    "query": "What is the capital of France?",
    "documents": [
        "The capital of Brazil is Brasilia.",
        "The capital of France is Paris.",
        "Horses and cows are both animals",
    ],
}

# Upper bound, in seconds, on how long to wait for the server. Requests applies
# no timeout by default, so without this an unresponsive server would make the
# script hang forever.
REQUEST_TIMEOUT_SECONDS = 60


def main() -> None:
    """Send the rerank request and print the JSON result or the failure.

    Raises:
        requests.exceptions.RequestException: if the server cannot be reached
            or does not answer within ``REQUEST_TIMEOUT_SECONDS``.
    """
    response = requests.post(
        url,
        headers=headers,
        json=data,
        timeout=REQUEST_TIMEOUT_SECONDS,
    )

    # Check the response
    if response.status_code == 200:
        print("Request successful!")
        print(json.dumps(response.json(), indent=2))
    else:
        print(f"Request failed with status code: {response.status_code}")
        print(response.text)


# Guard the entry point so importing this module does not fire a request.
if __name__ == "__main__":
    main()