| .. |
|
chart-helm
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
disaggregated_serving
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
disaggregated_serving_p2p_nccl_xpyd
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
elastic_ep
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
opentelemetry
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
prometheus_grafana
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
structured_outputs
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
api_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
cohere_rerank_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
disaggregated_prefill.sh
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
gradio_openai_chatbot_webserver.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
gradio_webserver.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
jinaai_rerank_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
kv_events_subscriber.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
multi-node-serving.sh
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
multi_instance_data_parallel.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client_for_multimodal.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client_with_tools.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client_with_tools_required.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client_with_tools_xlam.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_client_with_tools_xlam_streaming.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_tool_calls_with_reasoning.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_with_reasoning.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_completion_with_reasoning_streaming.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_chat_embedding_client_for_multimodal.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_classification_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_completion_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_cross_encoder_score.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_cross_encoder_score_for_multimodal.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_embedding_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_embedding_matryoshka_fy.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_pooling_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_transcription_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
openai_translation_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
prompt_embed_inference_with_openai_client.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
ray_serve_deepseek.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
retrieval_augmented_generation_with_langchain.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
retrieval_augmented_generation_with_llamaindex.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
run_cluster.sh
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
sagemaker-entrypoint.sh
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
streamlit_openai_chatbot_webserver.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |
|
utils.py
|
first commit
|
2025-08-03 20:28:19 +08:00 |