| .. |
|
configs
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
cpu
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
models
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
openai_server
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
double-sparsity-config-Llama-3.1-8B-Instruct.json
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
experiment_runner.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
kv_cache_scales_llama3_1_8b.json
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
kv_cache_scales_llama3_8b.json
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
kv_cache_scales_qwen2_1_5b.json
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
parse_results.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
run_suite.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_abort.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_awq.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_bench_one_batch.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_bench_serving.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_block_int8.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_bnb.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_chunked_prefill.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_create_kvindices.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_custom_allreduce.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_data_parallelism.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_deepep_internode.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_deepep_intranode.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_deepep_low_latency.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_disaggregation.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_disaggregation_different_tp.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_double_sparsity.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_dp_attention.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_eagle_infer_a.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_eagle_infer_b.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_ebnf_constrained.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_eplb.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_eval_accuracy_large.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_eval_fp8_accuracy.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_expert_distribution.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_expert_location_updater.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_fa3.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_fim_completion.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_flashmla.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_fp8_kernel.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_fp8_kvcache.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_full_deepseek_v3.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_function_call_parser.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_fused_moe.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_get_weights_by_name.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_gguf.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_gptqmodel_dynamic.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_health_check.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_hicache.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_hicache_mla.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_hicache_page.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_hidden_states.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_hybrid_dp_ep_tp_mtp.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_input_embeddings.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_int8_kernel.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_io_struct.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_jinja_template_utils.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_kv_events.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_local_attn.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_metrics.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla_deepseek_v3.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla_flashinfer.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla_fp8.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla_int8_deepseek_v3.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mla_tp.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_modelopt.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_modelopt_fp8kvcache.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_models_from_modelscope.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_moe_deepep.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_moe_deepep_eval_accuracy_large.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_moe_ep.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_moe_eval_accuracy_large.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_mscclpp.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_nightly_gsm8k_eval.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_nightly_gsm8k_eval_amd.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_no_chunked_prefill.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_no_overlap_scheduler.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_page_size.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_patch_torch.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_penalty.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_pp_single_node.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_pytorch_sampling_backend.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_radix_attention.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_regex_constrained.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_release_memory_occupation.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_retract_decode.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_sagemaker_server.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_schedule_policy.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_score_api.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_server_args.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_session_control.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_skip_tokenizer_init.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_srt_endpoint.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_srt_engine.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_srt_engine_with_quant_args.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_torch_compile.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_torch_compile_moe.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_torch_native_attention_backend.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_torch_tp.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_torchao.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_attention_backend.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_attention_kernels.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_attention_rocm_mla.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_moe_channel_fp8_kernel.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_moe_wna16.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_triton_sliding_window.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_two_batch_overlap.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_update_weights_from_disk.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_update_weights_from_distributed.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_update_weights_from_tensor.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_verl_engine_2_gpu.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_verl_engine_4_gpu.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vertex_endpoint.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vision_chunked_prefill.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vision_openai_server_a.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vision_openai_server_b.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vision_openai_server_common.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vllm_dependency.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vlm_accuracy.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_vlm_input_format.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |
|
test_w8a8_quantization.py
|
first commit @ sglang v0.4.8.post1
|
2025-06-29 14:14:11 +00:00 |