Directory listing for /vllm/examples/online_serving/
api_client.py
chart-helm/
cohere_rerank_client.py
disaggregated_prefill.sh
disaggregated_serving/
disaggregated_serving_p2p_nccl_xpyd/
elastic_ep/
gradio_openai_chatbot_webserver.py
gradio_webserver.py
jinaai_rerank_client.py
kv_events_subscriber.py
multi-node-serving.sh
multi_instance_data_parallel.py
openai_chat_completion_client.py
openai_chat_completion_client_for_multimodal.py
openai_chat_completion_client_with_tools.py
openai_chat_completion_client_with_tools_required.py
openai_chat_completion_client_with_tools_xlam.py
openai_chat_completion_client_with_tools_xlam_streaming.py
openai_chat_completion_tool_calls_with_reasoning.py
openai_chat_completion_with_reasoning.py
openai_chat_completion_with_reasoning_streaming.py
openai_chat_embedding_client_for_multimodal.py
openai_classification_client.py
openai_completion_client.py
openai_cross_encoder_score.py
openai_cross_encoder_score_for_multimodal.py
openai_embedding_client.py
openai_embedding_long_text/
openai_embedding_matryoshka_fy.py
openai_pooling_client.py
openai_transcription_client.py
openai_translation_client.py
opentelemetry/
prometheus_grafana/
prompt_embed_inference_with_openai_client.py
ray_serve_deepseek.py
retrieval_augmented_generation_with_langchain.py
retrieval_augmented_generation_with_llamaindex.py
run_cluster.sh
sagemaker-entrypoint.sh
streamlit_openai_chatbot_webserver.py
structured_outputs/
utils.py