vllm/vllm_v0.10.0/examples/online_serving
hailin 38d813617c first commit 2025-08-03 20:28:19 +08:00
..
chart-helm first commit 2025-08-03 20:28:19 +08:00
disaggregated_serving first commit 2025-08-03 20:28:19 +08:00
disaggregated_serving_p2p_nccl_xpyd first commit 2025-08-03 20:28:19 +08:00
elastic_ep first commit 2025-08-03 20:28:19 +08:00
opentelemetry first commit 2025-08-03 20:28:19 +08:00
prometheus_grafana first commit 2025-08-03 20:28:19 +08:00
structured_outputs first commit 2025-08-03 20:28:19 +08:00
api_client.py first commit 2025-08-03 20:28:19 +08:00
cohere_rerank_client.py first commit 2025-08-03 20:28:19 +08:00
disaggregated_prefill.sh first commit 2025-08-03 20:28:19 +08:00
gradio_openai_chatbot_webserver.py first commit 2025-08-03 20:28:19 +08:00
gradio_webserver.py first commit 2025-08-03 20:28:19 +08:00
jinaai_rerank_client.py first commit 2025-08-03 20:28:19 +08:00
kv_events_subscriber.py first commit 2025-08-03 20:28:19 +08:00
multi-node-serving.sh first commit 2025-08-03 20:28:19 +08:00
multi_instance_data_parallel.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client_for_multimodal.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client_with_tools.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client_with_tools_required.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client_with_tools_xlam.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_client_with_tools_xlam_streaming.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_tool_calls_with_reasoning.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_with_reasoning.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_completion_with_reasoning_streaming.py first commit 2025-08-03 20:28:19 +08:00
openai_chat_embedding_client_for_multimodal.py first commit 2025-08-03 20:28:19 +08:00
openai_classification_client.py first commit 2025-08-03 20:28:19 +08:00
openai_completion_client.py first commit 2025-08-03 20:28:19 +08:00
openai_cross_encoder_score.py first commit 2025-08-03 20:28:19 +08:00
openai_cross_encoder_score_for_multimodal.py first commit 2025-08-03 20:28:19 +08:00
openai_embedding_client.py first commit 2025-08-03 20:28:19 +08:00
openai_embedding_matryoshka_fy.py first commit 2025-08-03 20:28:19 +08:00
openai_pooling_client.py first commit 2025-08-03 20:28:19 +08:00
openai_transcription_client.py first commit 2025-08-03 20:28:19 +08:00
openai_translation_client.py first commit 2025-08-03 20:28:19 +08:00
prompt_embed_inference_with_openai_client.py first commit 2025-08-03 20:28:19 +08:00
ray_serve_deepseek.py first commit 2025-08-03 20:28:19 +08:00
retrieval_augmented_generation_with_langchain.py first commit 2025-08-03 20:28:19 +08:00
retrieval_augmented_generation_with_llamaindex.py first commit 2025-08-03 20:28:19 +08:00
run_cluster.sh first commit 2025-08-03 20:28:19 +08:00
sagemaker-entrypoint.sh first commit 2025-08-03 20:28:19 +08:00
streamlit_openai_chatbot_webserver.py first commit 2025-08-03 20:28:19 +08:00
utils.py first commit 2025-08-03 20:28:19 +08:00